diff --git a/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..431805f2a532ab6e17fcf161d50d9031baabfba3 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.3562210829072388, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06363294711119734}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.11009512311383156, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020727913604168193}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.16243977504759669, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002228768903465126}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.12013040778127415, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017746386859163203}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.016237573503050346, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005791686929917277}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.027893395046500822, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001039576769487543}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.01952192502751282, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007045263606140751}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.10534269523932902, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018942650621943632}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.1589275088375994, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021856832752487143}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.1164630301972042, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016922702496737136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.09138176673759738, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016976459528528838}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.13851750677859065, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001981721576730165}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.1010326136243227, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015162989057978518}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b17bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..20dcc1cfc5f608dc2c1119c43b3e53fc22f92baf --- /dev/null +++ b/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16625735855106855, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024463651813182914}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3230884270864929, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004359311826645138}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20872501710774183, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025765264814385574}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03520681144190837, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013363705236252219}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07441126206565717, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027685648685041907}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04541415352191168, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016019047132235528}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12527352638980324, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018832520008059408}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24649639309519972, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035131508278542895}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15771639364031548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001968467651802171}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12771639136222968, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001971864037023057}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2517880179492348, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003783114418327505}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16106544122061872, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002144088469758669}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.036660647928376, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0886671989991428}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b17bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6ad516e595704a7d3e55f480bae76f7c9f7b196a --- /dev/null +++ b/4b284b17bc4seed2/evaluation/generation/agg.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13473651953646212, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018830579225946448}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33263109371075555, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0043737298284748935}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18955906449065837, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025437030392446553}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02979980903695056, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010699057640840117}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07661622521673665, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00277147224226074}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04240941625507146, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015134151293483083}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10545507286869261, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014282925798028265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2622174946749768, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034532690725241335}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14860417887228614, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019427079439186818}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10644896438074114, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015535641404371687}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26570822729983273, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003832781853814249}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1502154921172796, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021382854049990575}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.6913128558245667, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09521771990115542}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b17bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..f49303e57c20369b7c0c1008e626bfe86e4a4a45 100644 --- a/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl +++ b/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5acf9e32092153cf8f0af5c91853b34d9b865cdebba19399b5ad1f802f36bb55 +size 4454140 diff --git a/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.jsonl b/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..69697b8fd701fb6562d1ad05d67201628920cf1e 100644 --- a/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.jsonl +++ b/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed45a900f08a095774f6f224b39bd55c362922ea32bc8f0c0bd18cef7b82e73a +size 2788220 diff --git a/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.jsonl b/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..03915bee7075e90b7e0f080eb60f81a37d6a3710 100644 --- a/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.jsonl +++ b/4b284b17bc4seed2/evaluation/generation/examples.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81016c90af5ffef779f0cb474c304822fd5faf4d585ef531961dff3876ada5a4 +size 5106203 diff --git a/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c81f4e72ec6ee7801bac04aafa6b251db3417658 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.3562210829072388, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.06363294711119734 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.11009512311383156, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0020727913604168193 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.16243977504759669, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002228768903465126 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.12013040778127415, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0017746386859163203 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.016237573503050346, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0005791686929917277 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.027893395046500822, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001039576769487543 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.01952192502751282, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0007045263606140751 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.10534269523932902, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0018942650621943632 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.1589275088375994, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021856832752487143 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.1164630301972042, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016922702496737136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.09138176673759738, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0016976459528528838 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.13851750677859065, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.001981721576730165 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.1010326136243227, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015162989057978518 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b17bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..484ae537b657245bbc85f41d09de8859ec1be26b --- /dev/null +++ b/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16625735855106855, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0024463651813182914 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3230884270864929, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004359311826645138 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20872501710774183, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025765264814385574 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03520681144190837, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0013363705236252219 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07441126206565717, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027685648685041907 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04541415352191168, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016019047132235528 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12527352638980324, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0018832520008059408 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24649639309519972, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035131508278542895 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15771639364031548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001968467651802171 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12771639136222968, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001971864037023057 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2517880179492348, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003783114418327505 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16106544122061872, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002144088469758669 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.036660647928376, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0886671989991428 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b17bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..025af15a08387939710f8d6df85dfd1faeccd5f0 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/generation/slim.4b284b17bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13473651953646212, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018830579225946448 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33263109371075555, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0043737298284748935 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18955906449065837, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025437030392446553 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02979980903695056, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010699057640840117 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07661622521673665, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00277147224226074 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04240941625507146, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015134151293483083 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10545507286869261, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014282925798028265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2622174946749768, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034532690725241335 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14860417887228614, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019427079439186818 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10644896438074114, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015535641404371687 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26570822729983273, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003832781853814249 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1502154921172796, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021382854049990575 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.6913128558245667, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09521771990115542 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b17bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_0.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0db515d5c15572664f8af27765aaa8a8bcf226a0 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_0.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811482 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928366 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767789 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.20817204301075268 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_0_lm-eval_global_step80108_2023-02-26-09-23-54_0shots_backup.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_0_lm-eval_global_step80108_2023-02-26-09-23-54_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0db515d5c15572664f8af27765aaa8a8bcf226a0 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_0_lm-eval_global_step80108_2023-02-26-09-23-54_0shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811482 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928366 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767789 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.20817204301075268 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_1.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_1.json new file mode 100644 index 0000000000000000000000000000000000000000..891ff640321c5d33398d631462ea69de1639e6b9 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_1.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.31, + "acc_stderr": 0.0146326386586329 + }, + "anli_r2": { + "acc": 0.324, + "acc_stderr": 0.014806864733738852 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002517 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.33520950594121324 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_1_lm-eval_global_step80108_2023-02-26-09-23-54_1shots_backup.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_1_lm-eval_global_step80108_2023-02-26-09-23-54_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..891ff640321c5d33398d631462ea69de1639e6b9 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_1_lm-eval_global_step80108_2023-02-26-09-23-54_1shots_backup.json @@ -0,0 +1,32 @@ +{ + "results": { + "anli_r1": { + "acc": 0.31, + "acc_stderr": 0.0146326386586329 + }, + "anli_r2": { + "acc": 0.324, + "acc_stderr": 0.014806864733738852 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002517 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.33520950594121324 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_2.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_2.json new file mode 100644 index 0000000000000000000000000000000000000000..73544308ed7e49dffefe988c69c6326fddf615c7 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_2.json @@ -0,0 +1,16 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.014770821817934644 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_2_lm-eval_global_step80108_2023-02-26-09-23-54_2shots_backup.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_2_lm-eval_global_step80108_2023-02-26-09-23-54_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..73544308ed7e49dffefe988c69c6326fddf615c7 --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_2_lm-eval_global_step80108_2023-02-26-09-23-54_2shots_backup.json @@ -0,0 +1,16 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.014770821817934644 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_3.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4e6a9bd14d06c3e535350ffdf2ea82f781eca22d --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_3.json @@ -0,0 +1,16 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928366 + }, + "anli_r2": { + "acc": 0.327, + "acc_stderr": 0.01484221315341125 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_3_lm-eval_global_step80108_2023-02-26-09-23-54_3shots_backup.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_3_lm-eval_global_step80108_2023-02-26-09-23-54_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..4e6a9bd14d06c3e535350ffdf2ea82f781eca22d --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_3_lm-eval_global_step80108_2023-02-26-09-23-54_3shots_backup.json @@ -0,0 +1,16 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928366 + }, + "anli_r2": { + "acc": 0.327, + "acc_stderr": 0.01484221315341125 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_4.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c72a9830d4dac0fd5aa2afaa76123b267cf7975a --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_4.json @@ -0,0 +1,11 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811487 + } + }, + "versions": { + "anli_r1": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_4_lm-eval_global_step80108_2023-02-26-09-23-54_4shots_backup.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_4_lm-eval_global_step80108_2023-02-26-09-23-54_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..c72a9830d4dac0fd5aa2afaa76123b267cf7975a --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_4_lm-eval_global_step80108_2023-02-26-09-23-54_4shots_backup.json @@ -0,0 +1,11 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811487 + } + }, + "versions": { + "anli_r1": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_5.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_5.json new file mode 100644 index 0000000000000000000000000000000000000000..84d60b9fa950d932dc8e79b40755d5dcd71ba20f --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_5.json @@ -0,0 +1,11 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + } + }, + "versions": { + "anli_r1": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_5_lm-eval_global_step80108_2023-02-26-09-23-54_5shots_backup.json b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_5_lm-eval_global_step80108_2023-02-26-09-23-54_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..84d60b9fa950d932dc8e79b40755d5dcd71ba20f --- /dev/null +++ b/4b284b17bc4seed2/evaluation/rankeval/4b284b17bc4seed2_5_lm-eval_global_step80108_2023-02-26-09-23-54_5shots_backup.json @@ -0,0 +1,11 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + } + }, + "versions": { + "anli_r1": 0 + } +} \ No newline at end of file diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3db52ef6818fd35a20e9b9c7143a1e817117c98 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d19f4f6717cfa11f4089167db24b0b29e1bb2817134064bb874840168067714c +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab525db474413e9e2a4d66938374fbff14781502 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:297b32a72bba9aa49c9537d880b9787a5a35eb47181f7deefe32272e4465cef4 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d484350cc1eec5febd0eff72ad552410d8c403f5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2e6eedb9bc9bd97ec987fb7464df3040b9d475ee75ef384a04ca6722ab85c7 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcaccb5a537c372312e890d08485437431413095 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e485b0b011011d03e037d0907626277584d572ad497e420af521594b14d312 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85b4f63ade28aca72fb706c12d226621e866a8ab --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd8c889e122a013bb966eb95ba0f0f8234ff81cf1364b05640560685be06e040 +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54af3a403b48f1649842af6308eee0ff775a1563 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01595dc0b077c8e72f618d8fd19c9268d9c3a26f2e6b17a1bd3e3ec765d46b09 +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7768ddeaf95ebdd3b64316399e49e351b55da2bb --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a4f5a39d584e098799a59a3372814f01ec9420c4ba42739b075b1c068033dd6 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee6f388c9dfbc9461a20cfa4de487e0b2c2029e1 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79c622f72f8dd7644bc87c234d480488be11ba94b1ba0ef4aa7ad95ff3cbc68d +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f0bd9a3400628b0f4f02440e47ee04b230023b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f90660386a82d21ec7cf70295a7c3a408a41512f1f4b4024778660c298b13888 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29cbb52c6a3bbe99b57a5c720e1363c4e030a54b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02315f4f1c48bbbbd3d3cccd3ad5aea92f6fd004b6d5bd191fe78c442895bb48 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e938af2fb7f272e3acde9ce5da9b156a57034959 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e0ad698781c5c8c63cefc365a36a9adc5156770cf5181b65b0ec09228fd37d +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a76c8ef52323bed5d7bdf4a92f108381408492bb --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2774f3874f8dba8200a6104a5debf22a883f11e0120b4c60666423653e01c6e +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7598ed011c228c40be6f8a1e177be1a042530df8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28fdd8002c30266f396cb23ed293aab7ec62d6c1470841c93e06dcc8a3db3c24 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c60f93f40488aa49f8122949d590124e676ad22 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff146a02f2012093b98d6a4d6b43107582c7d22febd5f3bcb987428070b3575f +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f9d851aa8cbe2ccae0f518755d07b623ae901f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e524180750e5069192c18ed03de65c1423ef06d21ade032cbb2a284fb351d745 +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e3381aac55e4c07b344ad0777adf021bb469b0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c84e8469b70d872f85a6dee37e0f435241473def04ecd19c43154d2f3c4b4f0 +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e4da54c7679c6b92b815bc4a0ac3e9ba72bbb8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63eea16c8b46dcac2761d4c1815598f7c3f06ffaeb9414179ad3702a9119fb31 +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7702b4cea77dd8d4996ed3935242fddbd54134ed --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34b2fe2d547558d51c69b8a2beb3e108bed088e2c1b34c9c0917272aba4b797 +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a02848c968dad510bcfb7d3a3d9368330b718f81 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd152095fe9200af67618d01205c2b6750cbc6397927eefc3239e567229a894d +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d3e82d25bc71be3f00f35c1a1a0272039f57cfc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e26143bcc52fd589e27998e0770905dd02c6d0e0688f40e37ce8eb05af2d0b +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90aef29c3333d580ad29fa21969e90c2f8b2eeed --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a5f77213756b50fa3818c545bb0408288e9716392636ef535cecf64bb4a268c +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3c946edfddaa5e192d21d1d72953b6938baedc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2712850a994a27a466457b619ca2b2424e662a10ff15fe9a87f4384de75ec13b +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f7935658f18dc10ad1adb5daceb15d1cca747f8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f757ac808f925c5090c7eea98f335b981638738c829df8cef1dee8c9bbdb720 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82152acf93bf279b05691e671607735552297b3c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dea9ecc09ae6dae0b1e7b1373c745e329724bd0b9ff2a07af3b4ff4451f46c1 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a33f03c9e8d8584dc49607d527838842a8f9f048 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f213727a59089773f69e4a576a4fb43a8ed8fe2f53d06ba127e533436aed464 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c69cdf183e4cdf0c21f8a712e8e82046d357e96c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc5d89562938d153423a014a48bdf96cca8a240121e59262de84635df48e1de3 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7adf79ed421b3b698c7e8ad461c379dd8f50609 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e2b99c559d05f4acab047632c8aa03a50d4fab2a8546054d856bc676aa3623 +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5131399e92c35df0ac46c94cb8233709edb391 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2dfb6e3f6beaee5bd8a62b45042d3f5b312d0544b917a136da14291a94ee3ae +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..632c7d42a2444306484a93dc58f22bf7a35a9d75 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec70fb5940e8e482dfad0d1383c93027356292f24b5b11d0299e6f832cc6603 +size 199058605 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f89e0d83441efe17d5af776a5676b32a78000efd --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685dd93ff6df146b541ac260e74099b31a3d5e03dbf0d6029a96f1aa4bc036e1 +size 199058605 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f8c20d3a0e7695e5d1dfec2d224879732aec5c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68bc067a8f9904d55db051addad3745281bf362bf78dbbb5823d25b9a31b4ae1 +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f60b3f048f59b289d47c9e1496632b8a555b8c78 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e4ea4c6d9235b4280f46413dc2d7c317febeaf6b5a208c2d75366ee47f9bcc +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a30735f05a909a76fee627f2c975a1ceeba2bcf --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ab8ae5e5daf77c7770ead8b642a0771826eb8e21239b758d473ef7e975eefb +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6d198df0a2d0d3ce774ea164dced9b64145f4fe --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250af9d46ba8c82a838e95be43b9c2674c1e59bbc4ad01876372cbc1afa6ff9a +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9be5d9c86b5d52ed47aaa22e45da8a3bf1f5c49d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9de381585ee830d97d4baea8845ed6ee38c35abd6c5a71716ade073afc63b5b +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d2bb9265dc1f88de509c67e8be37b43b87cf3fd --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c409ba49d77c1b8d8383b9d55430c3d25afc7a6a5869a3c02b65edb9025fb7 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22c28bc6868949b9e8136d0fcef24737af592950 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd0bbc2cc500a0819aa4dcfe93c395e13e6075225eb1f7da89261cd2ecf9aad6 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81289d083582222317d33d80a5916be6f7455057 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed065ebca37f753abeb0221ff52cd4febb4b05ca757466c4c704b7c341175e6b +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77905f6478535423a530824ecb9b36b57f9356d8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10a1b31411b84812004e6f6745e63262977a56292de916e8400e993fe996ffaa +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61e7e0ec03f0e558e99502c993c98d7adccf6ee8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90d39357c309fcc76f6bf852fffd450b89f283ca5e329ab49fe85105df5891ba +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ca3d5c305963718d708f9dc6e89ad13017f095d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff486bd94bbfdba08f16e479b58c85916ab3f043c4f9a3092d0f42b842931cfb +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e024225ede424975cb79c761a4542579e6f3ae01 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac7c327d946ed4b87729cf014886d050d5e57c8aefb86334da91a30f704b0e8 +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e9ce143341ef6ec91bf82064194a112e082ae02 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f4ff16a4f6ed8c63cfd359e56eff9a17c9430362003b6ebf820bc4aab9349a +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..847c8b77119f669bf0f6a65333c55fa4873cd7ee --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdc1e4ba79ec008182ca562ee9e4299dfdb5c6c2d797c2f3a9e260d166e38ca3 +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..905c2de14d6e3bac098f281f83515d5fe3cf6737 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f0c4515c9b42a85731e919dc729d2e531f364a4f741806041b0cc282e6a109 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..320df985f3a04c6db990262de4bb7ed55ab02ca1 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568db6055273e3dbe7d343787ab4fead169efd21a536be6aed276ec5fb9bac81 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1a104468dea861f9a57ba705910edc7a9a0ad53 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7aed95f8982b0277ffbca660283a0c908d450da9eea1788283ab3121c7d5b88 +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad8470c6f2a5aad902e1f843b89914cf9828cbe --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36121abd91218f5947558bb603f0ab7b044901c7afe0112ee2f20e6c231538d3 +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96cd2bbd0b61724ed6f0129099514911ad818fb3 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73db6a3f70c0a91af40d59816efd9856064db13a4fd79b9dbe03a47ed9ca16cd +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1150fae33ca857c6ca25b3d49ddd64da6689b3a6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b7a04284ab318f45bc9f2bab3066f3af57b17bf2698e24c906629d871669e7 +size 199058797 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa28fb8aed4c3ee2d5059a74537991c9c4c2dfd8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e435399b47fe0c2ad90f7e5164d958ae37a62db0493c1ec943d1fe091060d3a +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b4f2b2ba30baa4ddcb0033597b3ca6161ca593e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef6c959d3af2c9b34d23fd95bd1293588f5419c7fddd04a8fb3290fd9549cb0d +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6c50664a1298bdc0921df765fb6e11443b4ddf --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc0d4826b10623b620f3132b5e69766d8bc98aedecdc5ebbfe92976222abf85 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15931bea6a69bf6ccd98a396cb28d7a81a832b33 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d4a3424c15ea18d7f334f9240828f974555163bcf94eb191d070fa863a05d3 +size 199058733 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2debc52d534264f58df2d768658f4a6f92176f24 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15c5f0b33372e0f4fe1d291e462220c5be01cf1478c19a099e784c8453124bd +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d434691c46dd40004b9633f9f8bd0d53011a92f7 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0aa4202f0576ebada1a00126697d72e809703bee1900555094a8c3693af98c5 +size 199058669 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd3445fded99ee459eea22a63a3532194d11fac --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07da1d2738de9b6b6641e12bd24f1a2672e3e4840eee32c2583395567e4a5381 +size 199058925 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b6c07c35c4ae7f043d5fa69049ee3844e2f09cf --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b28cb3f30b890de716ea4c41ae0a39f9542623ec68508d7dee3086f58e697c +size 199058925 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee3d00d1e348c42121648596c39d28c2371947d5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087ae765d24fc56dcd32da7f4a2c710adb9c9a0e6ce41bd88d189ed4d86da511 +size 199058605 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef490c888e5c53344cb5f3bb9f6f0eaa31a197c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c0c5f6ca60532422c4dbebfe7dc779485db1c7285f4cc2747e2766a9fe8973 +size 199058605 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bc67e0ae4701a32f7446d0a4ff86f9f41cef35c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27c76216ea811ee821ad0d09ca6533686371dc9d9140178ef9c7dff88749447 +size 199058605 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05f71bbe6c4cb9cb4d8b2f39761a531067b6b0b6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892d5489435e26a7fd9a479e62fce568ca9433420742bff39f112d7659a57098 +size 199058605 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c568ea9ab7739e40b63231cec275bffb16e5de04 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e455f054d086367ca3e29d772bf89ffac39c7fe238123b8a85743600eab6f7b5 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e1ccf037dc78172399fcfddaa069a11c242fab --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85e0671954b0fe151eda1038be70dbcacff591a1f704d975be71b55c9984e9e2 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d1dded8aa07bb35670b5da482c81725102cac2 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e5e2a289bfbe910837a4a69c2d39a0a810f36129a7f56d24f22f4195d8e3d6 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39aa62966ec0bdb47373572a02587efd3949c3e0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae6fda67c864431ccd12358a1ca53133b0fae30918e1b92e1059156c22c52d1 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..274429babc10d5ad7a747ee4356e044bc41d6137 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7620c256aef85292489d6ecf36670fae066bccab86fa20d50d675954aee1d41 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06a9c8d30b47fdb3a7c8e235d886b35a5a34307f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37bea76157df589a7fa4335506b4561f7ce8ec8d00dd12b322de318965d2c118 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c50875b9cdf06532b729298345054b078a34dd1 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32833b2a17f03150d154fc8e12f95b3c0198f3b5a7af5105d8a4649f13bdfbb2 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abc1efc5cbad7da52e5c65754e34da605090df92 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd967d8e0c612d131ffc9fe7cb86373c6e481b58194abce29706f2eee930fee +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca19e85ce300b7c8dfe7286acab4647a2b54c0e9 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170b44538fd304e19e2315f5662c55dd492d267b58a0b70a99604f6daa1a0f0e +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5f8dee307da7df0eb0452b1a4a858bfe61b8dc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d67b15a180540f89b33ea24eaaaff335d69c13a7b98b16d464d0f35a7df575d5 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..754d5475197255988e4724b11464e5ef7e9c3ccd --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3eebe21da79ebc6546db9d80939b4b9039d747504e2c543d9209b6f27a97e26 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3897cdaff0d4cf0a8086f5eba83bcb150762f4b5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc91f4ddbae57fdbbf33843d9d8d29be5d9948ac1ebe325fe99f1bf36d093af +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4282e12185a715bc31779b98cfa8f8c9a2c2a197 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c64216d8db2c69d33b23fd3bec0d8ed17e4f329b80ea314ef8f874a3e7481a3 +size 199058978 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..525f14e37cb2450cbc820968c18e9cd97a80bd34 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb8afcec8433ae82fc3ef423bb50be961252a466e1002ba238ebfccc0d984dda +size 199058978 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..768e0876d04757f5cabc07ebfec3a5b3481f83dc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd1bae704cf5452838041256419ae9b2c03fd1d0ff94e36690c604d72d70f28 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75ede426952d27735fd7127fd532a25da2bbbb60 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cbc7b6995d963041e12b878b45ce411723559d23d4645760d23d4a010775d44 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0196c355998c8c65dcda859c8c76cb0fe42dc393 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928f1c5134a9cf45eb5c53c77a77ed773f7493ae2fa4fa1edc8f2c586303d979 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e92b9adc797325f56851d25667b74b344932c304 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4fb3cae55176ace8c564894eb2debde1d0e73911648cc5ef4fe69dde3857c4d +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98e2556b59721a4fe4c737af9b4d11bf196d64b6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b512c7cfc7200c530cc6250d36914211f245b7a7c0fefc9fc4b480ab763416 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3bf97213e58d064d90e6f50990f065f076ef843 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ae4d63fa3f6a8a7c7a3955e9827bf84bdb18fdd9cf24ace7aef56b5ad13719 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ced8994756227c6e8e3e95e5b079fb3c06258504 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021eeda49689ade787021ff51ac2e410cdf47d416246a1b1ae2b4892ca27e2a9 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70a8cb8e89878bad314770250893836776af4a4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56a6ec7069afe160c90ab21b31aef87cf94d57a04469f28dbef641d6d2d6140 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1955293d8632d8e0924a60fcbb1936b1bb7d9d04 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b532f490430a1093c8eba27cd871a2192e707ad2572599cac9796d43966c55 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c42788a94f459613cda7e8815ee32256521da666 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1636222c2ef8c7cfb27f956b0aa7118d2c04f410c6b4829aec0392296d29879 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d7bc9072cf111a40df03bf4436f75aac4062b5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63fd149e05b8ff477e1e8d259bb1ab3d77d64c3dd9f78068797c6a145a55c938 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe933d147a5dde4618b11fe9d885d4d88bf698fa --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b444867493a5b0f1c6f07deb2e2da3bc22e1525ae38d4d7c8cb347925fc1982 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0acf2f7333dedc0ad710954f96e5689dd13218fc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3774914676f9bfb1e1f796063bfe7348cba752955a11fd2354175ddfb0a4f357 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9f5e259049b26e63b6e50ab08cc01f531e5218e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fc7de3740e970417afeff1e6d3f1d92c09a597c32356e8413898cca4465222 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c2b169ff185d178493aff264f85355033d1b9fc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65449fc90f9d758ac85128e26e9e0689602a6e102fa069c2114c4c64f6861e92 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0503b2692ef31c60fef86598bf85041a98c29f15 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6d6fc6dd20e08ef4875a99372a55d60ff2b1abc5da8f9b88444a5431dd4603 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1144d6704caa4b3e56f51252a024e31d08d4a90a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf98c2b100601b4c783107645942949d03e04af35b861bfc3b37330d3819e19 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..589e1b5df0c9ad4969c35a75e9db7e2271509d68 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea6325bab8485f0859e38ab09b6b4e5645c9dab649948d2a0c8f8dd5af0cf6f +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4fc3c7d96220db677386c7763342c4bfc36645 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c5b4e5726b182970bc967c04e5382dbdafa4d275c91848cc61b58ca845985b +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e973ccec882a604f24d53e1c23f6659ecb726f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834094cfdbadba6abc4adcb34c4f7aca6ceb043097775935870a3cfbfe8a07f3 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70693eb0c3b38f0093c5d7cbb69fbe045921f129 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68267930a97ec235fe0a6891dc474d739e600c519623be1bdbd230ae8f9f2286 +size 199058594 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..213a3fade73e3ce870b3f25e627c35e56c1f52f8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b65af24f220d6034d016cc1d1fae55b2099c6bf92fb572e767dd724f678b9da +size 199058594 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38398a03716ff045ae364b99b904786307683167 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab614cd9f78db1bc48da0f5d4f0496f43dfe757dd1f50931af1fa0bde2bd4d3f +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f243248fa22987929e59e35b9ebb6d3d96590bb --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c21910903a0b07c42af2dde8908af671c7bf9f012193da164251e849121bcd6 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77307fc91b06fd7556d4bd603d4ba44469b4c041 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af968c2d78095e6c3104ef4963b3b56fd408044e2f2670a0ea1ba13697d61419 +size 199058711 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10957c0e209e925a4b9b64a0cd2179cc43e0382a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d10101d173f6aabce33e47e25ab1715eff963bc7605143fd3db0ad2e10aefa1 +size 199058711 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e3dac23eb9668cac68752dde936a7d502982c4c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c89e9b93524625acdda99af8b45e16e147251983fbbc11570f420175307ae472 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc8d03f2f20d3cca3f12d3d51efb671f88eeb20 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abb9c035844476878911faced211b016dd869b83928de2939aab39d79e90bc6d +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4891cbe602438019db672ee028b1211616919e8b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d97369df7108a7c6d43c51b843ade9315a3abe2cf988598a131edaf85951d711 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecb46890ed7be26a779911c64a493e786d08ebd4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86b593d70577a6bd03dacf8b40caa9713509553dd8938bd0eeebd0fa0258c05 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af7e2b672e08666264dee696cab6578b9cb03ff3 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ec49cc12503d66a421215a3f21226b5291ecbb4dce01590e6f74bd601f07a6 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cfa4162fc6b0d4f20677591d9ba08ebfbb99f89 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81d389cae38b4d68690d6df394dced9f08f7b2cefa9aabc69997918d4ef4d169 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7ed899b395b0c88c7795a17f30974895847df1e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6fa9cd4c95c7622137ff79d13dd1bbbdc408194b1e5021dbac7e06ad6bcab47 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d99acc782df476658da016ba18151b6cfda75e4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bad12316f8f8cb010fdfaf79cd5798bfae702e78972f4635a0a8a1ea87e7134 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b83066be1298ceefa38c741afa0527c0e308c174 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973f6c1d2cddfc7c2397b111c48dc9192709dd31027692db6c8a58281405a9d7 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46be5dd14b3bf82103967965b5befd5558e16df0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b292f1618588ea3df9ce5f898e769d5e9a05caadf2f33c93d6c76ce7a75eb702 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9f5b1a6a272ac061ee77b11c4df2526f56a4d02 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dcd1ccf08f62af59d724ec7e08f59dcf842373a1e28d02bb6e8c6f141d1f64a +size 199058594 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71871292ce22ec16b06b8363f60ed276d85c6a05 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:393007af30eedcd421fa40ea3ce4f4b154654a7adffd8ae1d269be831e05f6d5 +size 199058594 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fff26621d05afa4ea34c292350faf0d5ce49563d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01f2bce2d5099a6ee79b78e8b6c690387577a7dc8ac36204b291ba4d2a38896 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e37668962e6a4e531dd6579bf2a4bff2cffee928 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e51e6d1ad26a983c458a44aec9ed68c1a0dd2a0fb6c456ccc77a8e868a8bc64 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaf584bad3dcf11f82e1528280a193d2ef1dd590 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631d9e04f97d5ddf9ef555e57778260e67dfb35620b891e1d0fec456b6a3385a +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c2cca450ea9280b8caecde90327b811f26c6ac7 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d620f9df2bbb6f28acd9cc3cad89dfd5f0dd2f88bca7f0421d65c1f57844f0 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1befd928f6ec3ed371a3e3f13734aa6aa35574c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2fd7b34349d03f56b28645f264a3ef536ba04e81e5a4bc0a3ac4b961bd14a1 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c8b3bfb3aa729a2b05d3bf9f7026a28f578894c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea4b5318afe1dba124ada5d68c3a0a3f076bcb00cf6d1334d50901a9f57d2d3f +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd4b2c8cd7db2ffa68ac80090d7d055557cff410 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad8c0da7d99c5d8fed6417f316ec10f4af23e49f04ed3efe18ca23588deb467 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55773b977f577a01e0604f83625bde5f1cccaf3b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86406678adbd758ac3fea5bff81ccecf5ef3e302248a5e8c159f38a37e8d1879 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82973ba336799798524a8d1f0c6bd1d68638fc45 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c711767d564cba6b29bc6cf7dd61a5b52de383de1c94805b2879f3cb7b61b62c +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..115c5fee0e43db1a407b1cc8d0b90480d94f71c8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1be4a93824dc7d7858545ec399766a72f8f931110c7b232987cb334088280730 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed1144f07a5c182242229cd40357a9500c3c830b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf7c84a133a502806855b1962f9e333cbd73dcda23c0b1a9c6b8cab3c00f72d7 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..007fcf8e2692dd7c59e47829e534004291f89dc0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9852da7f038f808aaf51ee8e4136c25ac3f86bcc3e7496c321fce9b382508120 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..568ffc5c0a81796b2f0b5439d86fe92e8de517af --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fd43d5a01703fc197d0ccd1f289c41d961a65dd521ef66294cfc0cccb8414a +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f66613cba91314f94c3e333298e834904283e992 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1584179093d3ad45894dbd9feee586b6b6b59ed5ca0f7367ba6fb4a50a820af5 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70a1e07c3391abf0322f2ffa36c9d3b14b9b2488 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a597a9d0e6358cc62b13dd9495991feca4480b0718589bb103c9b9655367f5 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6794a789677bac0d23a238fc4d965a40c87a4169 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea08ac09fd357f0c613055d43524ab97ee7d19e067ab3bd0d41f1864ccd5e7f5 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3d5faf84bd34572628c543830707461097f7713 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74575642664d7976702722311aa6faf82487565a5308e0d7c360f680465bd9d0 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9d725035dfa8b92592b559983fa7a3356f08a02 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4b013f6121bd6c8860babacc95f4fbfb90f447f7ee3d3b02b5fe6f364203538 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9399b7021f6bc25d5339b094c918a0330df3235e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788ebbd276c50b3d15092df5b63ef7ceddf6834d7237bd9ff017ed595aa4dee4 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbca7a80c86d9abffd2f029725b73ccd97d4f6f3 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1101035253aa6432cfad216d53572cf7ebbde94f8b31197ff473e65ade359242 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1368789586b0da1f3248d26f0d1685cfea09e57 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3dccf38aca96a88e14bfc303d5823c752b9750cc8529f57a6d038bf203feb2c +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..437acd5c2b1e2f638bd33cad33d6c687386605c4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a56894f0625ab9aa9ce982c337fbdaa43fb10a72c5fdb1034322e080af4d6e6 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3f55494c24fabbb46327f8397701908186cf616 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71873ee26048c1533dbe0eec405a16865ce21c0d4d0123b882a32c8e096dec5c +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88f6af9a9c9b7ad2ff522b24e5e70b554f000e85 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15555654c78bf64f1d760136f8d1e6645bc26f74cbc9e73b95a56b7b3b72fa9f +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..478005477980b94621166d49f7c36b314ce6ab3a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a1fc3ee06074885063f0f5f16c1276aa289b857c9e12d574f190aa7bbc00c3 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc0cb37c3740cbaf75d78e58cf39ff3176202f7 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f0e3ed585be3cf57533bbff5fbb90146d1f50e17bbffa0ff2783c1984ac359 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0536c7e5c33851909330386cb4326f16681420f8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6f63dd266425fbda3fb0fcf8670ed00e21d0087fc6e5b4794be80df4bc4f8a +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e2afb9363d2e3c13bfcfcfab6b7de9b8ea53b02 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5859b75a22f128071f68592932c4912abe8e9882402b04c46a0c90bba52275f1 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43dd0fa7af9a7cf365c01db689b15a7a554d992d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca5b8ca3424848e7bdac7b5af535eda354460ae74f36699126e3aec04c5c304 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..915a1faa6737a1a74fe777b9c54ae41e243f609e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b76460c0f9ff1583737a020517ea4387443dd3668a1529847ecf07fecf326df +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac0e0dcfd92e65e6fae6f68dd2d2b155aed1a11 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0d50656d02c21d45ac3b38a688a26c5672bb3d9a24ad0541d56d1e9f465472 +size 199058775 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..435d8071cf991cdb11a62494462c2bd09e1c5a70 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e03b758d271238b097db137e03e8475edbc898453d7f45c6038fa69fed3e2f1 +size 199058775 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8efd501bc8cbf85c895a1b0007a34eac59c17bf4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ff91178500e056c455b2cb961ceb8f974b73ef61a213d3fbb9618f9e36ddd0 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af141c071ee44cbb566d21e06145203877e5fcf5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4498d1fdcf046d1883dd2f0aa1d0108604b57977c3073f3b0a958997a0dfb0e0 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef452df4f1c8bc559aeb5bdb4b6d599b7a392de2 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0b03e74895f99578d892a9678b17a16fcf0e0b47c6241245d1c471d5281520 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ead9a3bf289dcfc6dcbdf22a587bfeeda01d593 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32a7efab0d426a8aad8e70a593ae6596b80cf13eef9cb27858cc088aa443775c +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9d5a59b60d8d8c7d30a4c7aac4e0c6aae860ff9 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30753652a7053528ebf0b0acfdbd4d1eb6068a2e7648dcfd60aa884d5a08f695 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b255f074c99cca9cbbb2ef397d91e0f89c152fa3 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96db0e321c9bf651076765d7bd3c7e8423d8a38e4c2ceaf1563680cde608fc5e +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecacaeef026283f9aea0d3181a8c953466a991f1 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e3a2c06d9579ebad906e60281793c7b9c467f2c7e96add74ab0aaee3c7ba9b +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08dba19056f79c708af7c9dba3bb0c030314dd2a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c9e9e68eb9e1a24fe8a59470f0b040adec273648b472dc38b67bd609045e17 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77bc88a368ef404cf59a485cd7a2553a4fdb02c7 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e986bc549ac00346fe3744867492b5d8e3ae4cbfcfab1728de74a1884bf58a6b +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39eafe9164916a5d6176557a1733367272409e55 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c030408d828438fa7f0fa7357dc8ad9285835efb16d471342f76ff2ff733a4 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2001df988be2d520c60449958953b93790a0a11 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5608e5523987c282b732d3729db2faa9bc944ab10c944b737e0df58637fa6726 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1f353b493f7230c398184f737d3e1afb9e2f7e5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08eb2df97e551f674d9d7e79b088cb6e1445b8fd90b32e3a9f6216f494205653 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0e897dcb8b33c51ec1cf5ed00403bbbae6a1da2 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348e816959e6100551006f7c85c8d007a689e309a4e469b29a6b06a7b3ceab96 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..328048999caac26faba42f196fdeee4548ba246a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbda11f2566e0d1aec8e5649035fef455831e59b6d3a3431353cffaba426734 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1073f49dc3c9935b0cf69400bf96489c9b2fe072 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae15b366361748cfc32d9cc91ff366fe57c474c511d5696ca911e095f6db80b2 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fc510e097f1f7df3b69763350713ab5dc9a2545 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a618868652d2b1a5c464037ac6e0a80da2e04798088e2a8b514cf460a6bffd1d +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31aa83dbaeb03133e34226815f918c7af11e9617 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f61ca475f2c1ae5a0a12046d9ae88a161930d305c08562cc353e541c6f56e5e3 +size 199058914 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55097d8f2354f25616acdc68da4c5238f6b3b6d2 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4adcee676fdc28e7bc232fb4bb18a86075804321ae18e1ddf350b3db8a8571d5 +size 199058914 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6538cb0247ce5a782e7c6e0d627ae3cf6f41ab60 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b2406c2c15c37a115435a19ffb81b6b856c191bcc42aaf6fb64d0bfb1293f17 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9311917c8c7f828bc071a208f44a86364060d939 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48954ebba02df8541c21b6140762bb8ebbff2c8dc5c7a26d48c244587b462a2d +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81b52b978733475367a443b36571785922d9a2d6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db1ffa52c765f9ea7df8579641a3d785e11f62d09f62255a8aead60c6356b58 +size 199058711 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..626a66b04735fe041692534ce8486fe65541b3f3 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76824329db586fd6bd07d3b5ebc9954a77f6ea6c7ce033f2cd51ed1df3f91dcc +size 199058711 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..436264c9e01c1d43d6c636be939af03af55903ed --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d79625177820d6f09b42be4349cc7f3d8eed0d5f4f53c285db2f6fe56f5d41d +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e70da2387d92d8ab4b9bf813b37adcff503ed8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d1706db8c12de09f3a75e307730f5f277b4e1a2eb7553b0cb9a8e35afaf12e +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9b07c15cf471f9ec3054b047268904b0d357bb6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bf32ddf92c90d270a73eb552412eb9b303beb0737bde814fb3bb7cef3b6c96e +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3144f3415edfe411d13af906f2f8a2eb271ccd7c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789c4b9a9136d1c71fd9fb3a70696745445c947c6b02ebb101e712a3f3e9ea3f +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..345456b202b0525e66576a5a2871019221438fc4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8595ff46ff81183cf8d2e101c3a00751cfdad7af7b61bd7d853949d9570e7d +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b4bd581a5de20380a6d16e8487c3e523743c67f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348236a4640e0ad9552ea4270367bc2d33d1365acec4387fc3a31947f8591811 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..204b4527a6f5c49332bbffb07fa445b8ab7c0731 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f811caaa5afdd5907820e0a6a8136e251a2054f553e2739a18763d2e22367404 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e274a50605f10c9439f722e8e46fa0a3c74b6a22 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2cdf485b4d73242d8f38c2b0299ab50523d67571ea657a1865ac21e8ca4492 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbd2bded5056b67c1e80091cbe29c249c2c81df4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b671e89802f526d8f45b00930a0925b309aa227387a68d9e5010ff7691169fb +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..124a51e29e8a563e18aa5719855eb1fef9e78f57 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1c6be152bfed0fa2e95369be23647cd7672066e398af78e6dc3702eb06f214 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a59e63efd0a86c0298a3491121b916a8f50f19 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08758b793f2bc14828cabbae984a32876879efc5c33c249c9134372332a8bf05 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff7a0c7b23e8d762cd16740ea8b683a810180a2c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5437f430385a7117f4673492cd5636442de6064e308b6c2d19d67eb215c8d16a +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..828705af643a47588bea4787a55615c722ab5586 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77f77e46db961874af78f90b0ec9f7014ec846886459c305c4ebf2c064c88219 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ab573a1cafecf2915c960a3135ebf00dc852382 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e594f4ebe1e265872edae28dab6efde161c319fcb0520b66bda6d557dab090 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..509d9b3a7469c55a5b56137882c98819d5e67045 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4458a0ca488a8ec5010e336b5d714da8504a94b00830e4b4547001585a2269e +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac4186b6d9dc3757d5a7c5f50c79cf44271b59bc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a960ac519e5c4467e8153ff2be609d2787162f514bf1b96860fc44088250db0 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..819f3501cda8203bd582240c18c80a74ee9a91c8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ab74f96cc37dd64f3faac1913fea5100f3d7b5d2b57c862b544bcf047831f2 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..777a64cd666fb78cdeefc547ebce7f61088b7835 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e724d0cf2d4fd7ec7caa89dc68939817f09fe13edd6ee52b97a8a368cd4c7f12 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edd2f67b7da339dc6d56d14407d0b0d72bf67a6d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ae3758099079089446ee20869f37b8114b21031a3ef686bd4398215dfa9ab2 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c014788c3e8c9c4702dba953765d5a8d9dc0ed4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c17062de217b8f14f8b79ca82e5084e8873000a0bb91c00da8cb3002e67ad5d +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57f4382051aa8aca30539874a15766f123ae0c3c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d66aebf69bb26ee21500324cc0eb9e18cd7400f77479026aab04fac7d170329 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..803846e066f11aa541f5c3cba8c4cdd60bb33c71 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702efa84b02f305bc9634b311ee0f8cfa253bf237d37402b43d9171a576bba59 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf1d4cac37c6b6cbdb8cfec7f6262f2d77a5f920 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb142f9ad7d39477fed7fc3cd27ac107f2fe86b7358f4e147d5a375857643f07 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1532eca4058af5fb734f522ec8fe6c1988670c93 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c202193ddf13505228a7cac3b8e4c4338ce7d5ef042d9c465073627370658c +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d244495671a5f50a6a9a2e69917bae6ca03d4a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c230506ec6d8c51529a5261cf8e28276de22639bbe20404ad56fe5291bb8689 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e692fdaa0d6389d6805d5367d14a884eb20ca7a5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6839a1941c3a311cc5f9d2440752d13180dbbeeab00ead3f5c88988665ad8938 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8898cc0bba06eb9846cea3e47aef32aeae748c91 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a727c556b6818e0f64ff350ba040f9b68936b5129ccedd7af43aba9cd8883308 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff35d158673cb088ae35f63da6a3181816b0211 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16ec7be94c756dfe9214c89b6a9427b60e6c993b49d15f3a2db5ef1027fbedd6 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e976548c7c695b2977cb0449593fc958e9b2a64 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06aef8d4b203d1e313d2fe6c1006dab982ee2cd129c504612a96cac39530b057 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06bb02665bd696721f3c1a925a86d799b9b049a6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619836792e329bf188beb97b2bf23406fce075fe4547859a9595826e7921e25a +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c538ca92c5b157c0f15397a6471aaff0efb9ab0d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e798a0aa12ec2d0a97ad8944a018c3424996f6f1938ecf4b7546f4a9cf0c1c0b +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5eee435c8ec030e2589acda2f5b76823c91e229 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca83542e864fb102d8cd7d90cf40438a18f21fbdb39844ebe5b41b2a9050be1 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e84fbef415580c95462627b44dce317e43d980 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba179ed73c6cbc8533a62a55f090de568708cc9901eded52c1ec538ad4f1d22a +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d34bcf3ac90aa32f4ebe826aecaa056add38611 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b09546e4303175c282ee2a85ea3ccc307abb79652e5b84d6f0e7581f5d08aed +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba357a2b540d357d295853537f1ae7862bd7adc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10d83f3f5ca50db3274192a411ae3521036a6116484ed7332781fc25bd5e5676 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf2c92cbc518c5bcf10902c6ac277d90b6cea621 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:343b4cb5623412cc9f6a52487faa446ad8c57c196a2cd530e426eeed5c3e0fc0 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36e9b35a680cf57ccfef57af0b89c64d6ad98ed2 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:333ed3a41bf0042df589ced86921a31e2b34918aeac09231600948ef8c0955ec +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c571814d858cdad90ba54edb6faa118db2b3a08 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fddc7c28abe2e815afd75179b5ab49d470b3dac10a4ac194c16ea0ed67bf3d6 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ff5abfce404e9bb3e3b7ff26221d064cdeaa731 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23487dee7e1bcf931d955a9efebbf27c18b98bafbcb2b5b16d79a3d221eb2089 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7145ed951b9c5af53d14087bcc308d5991ba9ed0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e98903923edebc7f4accf6cdc5e5b36e8ab464b9e9e5e5763f2aa3e6a9d8b16 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31dcd2df6dbbe5e58bbec22e0cccbc5cf996560b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:002e47c0af4fa7fdf049140658974fbe7aa3d7947d32c7d99c00b775c35e2a44 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5425e0fbae31a5979c01a288e1a87c638ab70b3 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecb9612608668a3948ae550859cf4ed48b85099a8e33163b5e2a73c66ef5371 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8562b9f5568ad31577527e76edeb938a71e615fb --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a53d388663404c9179669d69dc4871023ed76c74bf35a898633c0eba7a90f42d +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b459da4adda2f7b0d4a4bb31e5a695df509297e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22393cdf7f10fcba2fbb1fc095e5667bd77794a3af24497ed6755dd5c3f3a843 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb5da2432b33244d2ae127b00ba1148d03c6326 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca1d8e4c3d7481a9239b929fdead12ac7c7835ded9f29a0e72f2e563cd27ca3 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a16ef33218e644eb2eb8d211a0b23c97e4ee2e66 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d8806927508f6888939487b4ef0047e557c4070ec77ac4d13323a8dedd1e81 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e756a074b9bf9ac8930a4c0308a8e48695c8dac --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a761212bcc764c3fa8513c7af1afbf3d5d2b861cd79083b58bc1ca876af8c1 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..288516939a34ffcefa0b3c94640039422789a163 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6e3b51ac66e981cad48ae87b04c48bcf0f09a87871a68a9c5c690a5771e0e9 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eea0f6f9deaa133b0e85bf721c61066866e29fa --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cac9afa7a577a9eeccef620942d155a3255cad20d84b902fcf03a0f28341fec +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cd6469527a912a7f5fb5907224f06b21480b777 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ddd590c525362bfea57609a37d2da61ff5eea55f4c6e93c314412b83b5c85c5 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a33bcf41adcb35d16ceb7ad4d663130ec919064 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b54c8b12fe82d2593d4f31be1bf17cdc95c1f09dc27c217b3927cc464d1ac8f +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b40bf2fbec4ed6b5e644b699ee21a3d4d5c7f001 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27723ee345eaf6ceacf09b0b5de3357623bc1d13edce8c965b17ddb8951f79a7 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..592335b4c5d7790d296dd8e4be7734e05c7d0538 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec029bbe616dd290e4fd56f56280793e520f7650b103c42183e2173e58126548 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d68aa98f9388e60f8a9d78b785c77a31ee2a013 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1eb07804357bb7738c1b0bc9a29af5d9ead22e261a2d3d1cdc5eb74f592f549 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7782f4364e18fed6f3a7f82979911477213f8af5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4647e1ff919399e58ddad7067eaf82ff7719464c4cd715dda3aff1526afeb0f8 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f12140b1959b45956a63d00305e2ef2511c8a2d8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc3fb81c9a8e2693950e4c97e2048ef1338607bbfb2333acd1d2fe1136390050 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c38f3db63389956b0ddde57687efe9b44103e8c9 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21bbf609f4a30619d8257e8d934d458f273c899b374135ced2f91c89326bdb3 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0400adc3d1379672be3692f92c3d0923124d38c6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fb4ed0ca4c6880f390050d799606718a2bdeb71fc322ec05ba2703115287311 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89842043c20f090c3d0b44adbc01d5393d21882a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f589c1445132a77169309546f8a15636921422fecb4d54100f4aec38a6027e +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e58daf7c474c489f654d4d278f85d300b0dfd6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:412dc4267a7c9a0ed4d6106f395d1a874492515becfb31fb0e393b19ff2d6fca +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfa040aa2e35ea873fa3876feda6eb0715715b75 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0791df45ffb7313690b6fa54d6caa0e536979188c7f4bae3aaa09b65b43440db +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e0cfd14fc28c4fa9d203930dcbca025de19faf --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd32a0111666d648e8dac0c7b818f1b3ca9f9276139b16f496b9ac7fe04fd26 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..847f44bcb04a02e3879c457220e9b0bcd8d2b7ef --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f8c87ec1f2b98bfcac217d323d948f0530134c4b96e349acd309ba241ac1646 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0171b9036d4fbb879515c9f99bf1627f9ec9788 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6356f32a7a774cfd053881effe97fa15390995ac390fa532196bd1c4a89fe659 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..748f868c767b868d6aa95e1febcb74cab06e8bd4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62c83a638f6d9cfeacbfbe2fc1fcea1b2db460e7404625957a5f2ddef2b53a86 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e7a748d5d053c03c484a594b2f26b403ecd80f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fd3c8d7751036ef8f45de67f5cb2b352301ff0ba521e2780a3d8b35fe051e2 +size 199058647 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff11b8ed223555152d213f7d9bfc7f2b04ab98a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56cad7b104500ff1fcdfe620a88d3fab3fee38df0c48656660e5579a999de646 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..954b755f4f75d0521f0e537dad6316844f29c0c0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fbf001fd7e5f8432970b4f0c9c0dd06645996c0fa9b4a3b443a4eafd2d9204 +size 199058850 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2261b1f1ad39fb9b02ed68140efa8ec2071c64 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a735904d01baab63c7ed8a2502f27aee8bf7fed8af3f71711c8ac2f70cde23 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3be76413497a6a8df88cb34c7ebb68b09821c15b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a95cacb5936122e95c74d25db204976c87a7730432bf61314ae1dd6e6f9a9b +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3bf3243e5a153c7979ebaab8e15cbd9d23b7545 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a672d1938966ee949b3e40627dec0b70021375838e5aa51f913de02fb6d42cb5 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f86c8d853a3c126d74303ffbe8e6c089c9b98da --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dd7a432d3c2958d71cb51516e29089337167eabc0d6824d1572ecb321577bfc +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7239c6500f00e38315d1262ac22b8d204a34b47 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22feb3061109b4cc7641e72e8f738a116d586fe4e45648edbafba404109d9746 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9f219dad0a9995eeb86b195cde5d2829062d6b0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a320392470eeddd7d2336171cb9d55bfafd115ed11105beb933383b4dd02f2df +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1373068a540e2d036806ee0f3aa7f7fa99243c1 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8de37bb9c83f752db0a835de1ebdc827a28bf984e71d82f52a3cb4065e7ef86c +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf63786aa120a96d31cd822d71f604f115088eb0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90692dd653847b92b0d342cce954135990069cd415f4c36ab8b7351af2068a9 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37984cf7f5bef788e741b12938cb9d3152859f14 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf83fd4287b4656da8a12d83e4af085896554c9697e64818ac98918fc711d86 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75eb1be1cac1c52d48bc2421c2caba3f768660a6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c977f71a58697f694126d417c2a9f650d840d68a5d8b52d05692a2d8f37c1777 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d170a4393b3c74a728531122651558979e3fc37 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf3d2429b39bb25751abdbcf0a017365a2bdf98ef6180916b33ed4327aef410 +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e86e3b55e16dcac0aecfb5a0f851c9877f4064d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3319ba1abe16d881db0fcb0b28829aa94e069af4fc4ed22bcfe26cdb1328862f +size 199058722 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac439e02ba3d0a0e10f412581f8ea262773cf23 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc6136c0bcf4f1c83a0edb252d4f439c8e3b22e02dc976bd6b6282343c39b5b2 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab14052d2bd36a4d41a0c26f94ef59ca038a141d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b41dd232e8b7c61035c03e7a855ea2cd200eb1ab00a81b305c57f87d78a8e9 +size 199058786 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac9a3c57d001322740e7f608a057a66e36775b7e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ce49655d2a936ee19ddbc88b5d6d6c9a9efde768ef1896b66f252f35f5de02 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3de226cf870e86cd77f0cf3e967a4e54b11b99e9 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8155acd596d01a59a36324c5ca99afedeae352fd4d8761711a6762d8caee641 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f897164ed64ed15a73891c0cb9812a8076ebde0b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a646d2c035445d19ef9359a7bddfbbd5c8488a3b748ef15967b420d54dc2cda6 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d204f6898b3485a7e18d6e60a49997ff1f620285 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d66f709dbea51d63a31a494a5d1f49e354e1fd654783085e440797832b087b9 +size 199058658 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38f5f642a38198b223a1e123101d2c4729de7118 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c09f61a2cb7982c64e280bae2a935fcae07e08ec592e54930d01234284f3a23 +size 199058839 diff --git a/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f128e15bd957ab5ce56e77248c002d1a37227e20 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba088e6dc02681286f51e44e7c307880780f8b0ea6a2b7b76ec793b90956be15 +size 199058839 diff --git a/4b284b17bc4seed2/global_step80108/layer_01-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a967aefad48113d53776045dcabbb48acbee3c76 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e0679bb1994fe466d7e3f280039a95fa48bd30df1046c5562e5af210753c20 +size 167511299 diff --git a/4b284b17bc4seed2/global_step80108/layer_01-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ef811f8fe09c99753444cc819690110a019437 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d1010aa2bbed9bafb3bb772bd09a8747756db73a1f85b9e090a3451a1cba8db +size 167511299 diff --git a/4b284b17bc4seed2/global_step80108/layer_03-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e43d14643a8d7c37a4589b0b14ebee05244b555 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e1f60e929f96f9bdf42d606d6b1f690a7ef66530a16abb61851afc9138e062 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_03-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c346a3ee835991882a3ab6c28e16a87c209b5e8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7317ce089cf3d08757d0bb03e2110657acebf6100da1ae4e97a5fc696a793971 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_04-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aac525f6c947d4b38084e4928bb5aac67203000 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25aa6cbf67b7eac213d3f00b6b7a859911e171beb9126de013c0c8becf597f6a +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_04-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..283c98f75f946469b23b0a81f306abc7fda7c89c --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c47f4977ca4d4288a5130e3d2d469b71cf47e9980028ca3c0410ccf09061f8 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_05-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c4ab810dd343eb0eb40b55ef2cf3228f5e2ecb9 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:216296f27e97cc0b42d5a63d0b1cdfdda8e1c720cf2b73531b1b83a00ab2a5b3 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_05-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d11c4c1fd36146c3177dc73aa5bf6e231e40b89 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:999c855b377934e98f02c00626b71f16229be4515c0286968f9e68ad92c6a823 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_06-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cdfea046ac0813a4f18a1361abd1b584d1a4b00 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed23fde93140c204b4cefee640ef2a78e2bfdd2ac9558f451cec6538c426ebd +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_06-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d444444f49801d1d9e7978876231382d5b9d20c4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1773bcefac8fe5dee8a985bb634af5bc85738b78989271b31e8fcc437190809 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_07-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d95fdb2065f487f28009f638773a093900a5fe5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed0a99efcde6df45f07df10f5fdc91985277a13fd53f46d9feab90e286d41cc +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_07-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcf66faaabfa34dceb7388086cc5442db8036808 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfddd54c864e7017df7e1f656ea0623494910748a0c9226a59028cbe290de9eb +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_08-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f8a4b7355e1ca26f458d2e6ffdab66e673ed220 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f13aaaa53372dc11531ec98657a6efa15836ecb77a94dc6cf00148c0219a75 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_08-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776f613a25c5a28b6ccb8a059dc7da69ec599400 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18c9a8fb33ca6d527b0fd7b2ca80abb384ef6a6a18f5a50e523d9708b5666669 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_09-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3744cc517a4ba361bb52527b32b48e9f1d007237 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2560bbda0e5934af29c852be02aff1de60983e26a2bc8f9c9f7a23ef5d49ab0 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_09-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f83fa599b2b8160d182e043d86969ed85b3d1cf0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cd6c3443c6c80b69396be65503c6c8557ada5713102c2c0a1ed48d88a66c8e +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_10-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e0b3cbad14f3476edbbbe83659d6c1c59cee58 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f75b31ef6d5da1c3398c3d68da0f2f2eebca425ea3db51a4639fc3adbb85e5e7 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_10-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..245deaf28ef9a4d09846adba947f6f6466b7dacb --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc4d15949bb6995d82e53504129606d7c353c8965f2e48426c3cd4bbbd07a9d6 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_11-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3d458308bb5a9f653c928f5ad574221a441b8b5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a386346bfac74adafa55e427c409d259f4c950aa527da8aad71eb3e0843119b +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_11-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab509d58f82ea7f7e3be01278e632a9f00fde0cd --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1121499454cb28ae77ba7d9fd22dd81f2f890bac6ae9d7bf011dd81ffc1cb3c4 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_12-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3a6430e2024b9966fe93201a4deada05267926 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5994ba8d45db89942278db5d2156a2e829d6746d0b2ae77872c532d0705890a +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_12-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d5a2a7835486e845369eab8b5984361dffa7181 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64e492c400dd3123009c0a799df55bcb617d3a71d8550167dd8b1fcaeafdbdd +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_13-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8eeecf2ffdcfe7e05412128dc5077ef9db8e423 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72feac241d218198f5d63a507f30f5dc33bea694439dfd63d44422f179f42a25 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_13-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94fca3932d48602fc4fb3d38a7c449b2bcb51ef5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4131e20e051837a8167d839abd87c7c6d0b4529f11c2520a9f5a84c8a381240 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_14-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..723f444c3fe9ae48730195c3fa80f77b4575a2ff --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99bef65a1796896121547e0c4a01363dbb513e2d656d3b98e408632620b41bc4 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_14-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..429caaa81873a48aa96da4d3683ebcb5b78742e0 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be4f8f5de98a6966c618e767aae1055e485db3405bd62f53bf8086ba5005782 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_15-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1452f46e58d8ca0297e2fc8a9aa324158edeb8d5 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44851759f91b3e4708dc297b8e4a59b79839a7ceea2440ec48a437ebd948bb62 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_15-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6e0732e540264fb1c8799625518e3782cdf7d0e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3ca11dd42280a02ec11c6ef97854949a078b3fde2258b2f78fe4455eabc402 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_16-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..377222eec4ca36f7f5811dca056905235acae462 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e624243bb5dd298ec19845c819597c730b32e87b95014df43d42ceb36d6511f0 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_16-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35d1c5eacb5bdcef18894c2dbd75bc8494e7f747 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ebfd1c8b947f33b8b4d49ae6c714587c7af122f1cb811b50076db7c7b88db29 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_17-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd95969216a4b78fefc8e70cd0cbb440b9a8f9f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d23e9e9ecac33925b0ad920fd6f47adb6dde859132878b0848b9cd425b7ec7 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_17-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f07101e6ea80f9b08a95dc734237f5d7edd1c472 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f96a0d20a056ff0611833084074cca7c31782b1ed8772dddf7be676ef7e43c +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_18-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3281b2e41e0a75c4bb9c95bb0d7ba15bdae9b4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2be5781efc4ec63056bf7680bf44887bf8d36c60519ce836a6fdd5b265856b3 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_18-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eb85ef3958eb80f4b3e56ccbfc4ede7f480d73e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f746b4e2a004d92155e52798ebd70c5e8ef7bd7566323bb51c2746bf25c72c3e +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_19-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4456f71c028251dd672badfe7ac7f49c919e1268 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60dc9f9e7239335ff5773ba9d86477df2b3e120d5bfc93500c3e21407741f00 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_19-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c2adf18977a10bf5fcce19ec758a5f4f05bd2d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3e32149c4221948c2c1bc21af229d82ea8b928ddc2d306800514f0511d0525 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_20-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa84832d597fe1d8a44eebf70405157c14f9a21 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebae920415ae0a5c9d5b5e690144386cd216ca636cbe9b614f109e63cfb9d565 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_20-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..030ce8ff168276b28d2521436f37041f00897747 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3268bee05e5ca6eca545a57829be8a3e62c1caa86e0ce56bb557d42cf619ac40 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_21-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a32142d7c4fa8cc96573fbf6e9a8e6e01ceaecbb --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db4ffc8cea4034a045db96d0238a5ae62f175ac49768bfee19b9e22b7deb70a5 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_21-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..929641005051a8f6edfa75d79414834ca3ec17cc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d6c12a3c321d2f66405f174cc1fe9aa3479a4f660c6779173a946dd51ce334 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_22-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89169c9a24d730705faa7c6c9926ae3c8dfe1808 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9666de1206c1bf488fdeaa6228f4e4cb8e0f65ed0ca213ea7b846257f3bf4d7 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_22-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfc661b60e1a8b57266b8fb700494411722c4f49 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bfc55b43a39b71484721c5d04130999a61cd46ace262d8e32d16d2f7f2c0a51 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_23-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1540412cce7fb8e1ad269ae6a580c62c05883309 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59cd5a9c32ae8feed4a1775cb278e5a4fe5f6e505235566abfed0e728bf6485f +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_23-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b91545d7282697ee487d5e290c5eec1b5e43de2 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b763f5f8a8f981d1502d97fab498635b5aea1499edeaadea080ed3a2b62fbeae +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_24-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a5e297dca584a5c1e1d5149af14fc07e74e782a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d575e6145b7fd5e1f84054f5677ab2b37f526072cd0f9580ccd05270c3e4b14f +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_24-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dacdfd064f947697f5d8f9128b5f3e0742a84035 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200fd702e5497c88b805dcaf498d77dd2a02d9e448d9d78f21c096c606d7cec6 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_25-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee260f75d61c9c3b43df1a2ca93991ca650bd5a --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6992340457128808838510be36d82bc6ac08033d3533b2190bf6694a6b5f3bc4 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_25-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e3950e6209801d7f41d822b09bb85cc25c386ab --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b84d2b00b5ad5faa6f501c6c20ac83762bbd7076738693782293abafa76b324 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_26-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0753a26bc65f5d09a650338477cba59173f9a19f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221faf5bd46c073c24d1eb8f8a2791b08b52c45d30c223dd0092a562fc193a96 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_26-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..483ea8172bf767979a502175e187d5dcb69f380b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b327f62b6382ff729a37fdc53ad34c4802f9cdceed70e0978ad878b464c80940 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_27-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..946d3011dc24c4906007bc410040e5e51cf59c41 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117017669322c3632f45491a64f977997c12ff823d1ca76ec248511b5c81ee46 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_27-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58e1594362099228ab0794efc72ef6f298fd46f4 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd5bd8e43370c3f695de9ddef0a6641c4df465cf49b6a565c9db701192c1b4ba +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_28-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43c151633d6e3eb6a566b8e70dbc81d0f010a532 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50fe5cc7db40d400f5f059db509c8ef4fe1e005fafa7d587fc536bd838a3cfc +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_28-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c3cb033a3d86a17450bfe087bcfc543e9bc2c9e --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:748d811db339912e23408a52fd0923c9a7a8015514d1b5f793979ffa2dde0ca6 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_29-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f427478e3cb06e2e579003fb522bff2f0779113 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77694f76771fc84270724554339c959f6830561071e90ebd275ab40efde12bdb +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_29-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb108a2f704ea4ae6fc18e1eb29897d3f9da180 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20839b4d1ed84e76029354596059100ef9e84f38a48d62194e5459bd4ea17d0 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_30-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8909d2172a3d6fb02e4ba6335eb51e4e388611f --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a9258437d620f50cb8ba8f2d9ba58b4a9626d12aeecefecf5448bbe3fdd7b9 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_30-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c16e2af1a283e6d6d6d6822b5a9cef696b4265d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c75ffeed80872fbf2fd50e05a3bd8af23a8c1b5e57ffc73df979431c4e1bb88a +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_31-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..721053d7ade88016ed871eae00851d055736cc35 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64861eebc13d1dd7dd433bfdcd05b3d32766f06e382305473b714306cc0e0c5d +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_31-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b382bbded3d1d394330886b612264b20131d2184 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f027c646907f36bf26bd30b951910dc8ff5f11b1f78b964e82bfe093b2a473dc +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_32-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8da9e1e19fe4652344d228f64b4e76a5376c7b1d --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:234c87b255b027f184a02339df3ee94c317886ef3e9f0f40e2d2c1f295f6abc1 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_32-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31826d0f90a715429cd99f1164f1e53d50b267ff --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40e8a295e7bd58305164c966daec196171e3db6b8fa8ba37f13ef47a0cae648e +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_33-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..425e1647b0019881710eeebf869e31728f845938 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c00aa9a17d9f17a9e0e27badce4ede8a774a47f4b388928670bc6ac8c83c8345 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_33-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ff25615702fd32465a19c86f752548115268bbc --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf9376a8e6a7381dbe16c71b3d9972a8aded2a47b6fb10f1e0b77e9e15938c3 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_34-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed1c8d5d97c012b4ac0df12a24447fd4b1e0335 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81aee7d95c9eb0330d0970b34cc737a7d3f5f5e5acbdc96630a84a11017552bb +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_34-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b1231772c6463427a9babaa9ac62ca84ccafd8 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c4aec6953ae2aec8cca230b2aa6871585abd8f1653a031b7e9a9963412f9d6a +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_35-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..123ecb1ba570364ea9b34a411f760d9bfad3a976 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f87b138cfaf59fe92fba99de17160bef76c1299cd2d7e4f6e5e0ebdc726b32 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_35-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9689b7c10b99b7be62193920af2a999a867067a6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c206bceca46dac953f77940d147dc2b2a0cf8aebafb97f3c8ffc80aea36c8de2 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_36-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55b21fb0c3781e2501ae5cd7aa5dfd47157cb778 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f97af11084df1ab3797104cb7588f0e6ed98d69507335b3b639caccef205d7b7 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_36-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..583684c125bbd062257310347c564caab4c1640b --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b262746a5e156ce471b9215cbcabcc54cef0c5205a52b287bf0a2b41ccc9b0 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_37-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f21db0354d11852a6f39f381382d63b846174563 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:964bb230cf52e23979eb4cc371198c99cfc4cdbd417bd165c940c4e5435b83eb +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_37-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5efbe28c6872588696af348ff0c82e91d2e82cc1 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5956c745510d9f8bb49a7258d4d8862cf69ef47b643fac8a669e3f873b33a442 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_38-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2507b18dd0ec84f9405b72a725c8f5369a26c8a6 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fba62aec4c211c0b315e2a3ed3f8690ed3760e3d9746ee03217a57d125f95bf +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_38-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb38bfa32493589319e948c0f6a1a1c267fda068 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337f513f93306e13d2328187982dd60c86fb399979699afb8ff50195ac521d56 +size 113308931 diff --git a/4b284b17bc4seed2/global_step80108/layer_40-model_00-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd7ec076a4042edd04d689ad16f60e81f81fc855 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf421d8c7d85931c2675363d119729707e59367da146e1a69f0e3b2aa18473c +size 13507 diff --git a/4b284b17bc4seed2/global_step80108/layer_40-model_01-model_states.pt b/4b284b17bc4seed2/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b0766208f2ab3eb0a0191939779186f67eefa07 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ba6b77b6d37af1b9b899d4b8aacfdec48543552181e3a103807e2f986de129 +size 13507 diff --git a/4b284b17bc4seed2/global_step80108/mp_rank_00_model_states.pt b/4b284b17bc4seed2/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff406dc0fef923bed7266376b460fcd50cfa925 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10642d72563e003e7dec72c8e721af128598f852134afb459c91694c29b90a9f +size 51443 diff --git a/4b284b17bc4seed2/global_step80108/mp_rank_01_model_states.pt b/4b284b17bc4seed2/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd15e6605571edb42a4131162852c7a07f3e551 --- /dev/null +++ b/4b284b17bc4seed2/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:371b7fb6ab3ee190735ee236b1ab374b27011ee08d795ba8a1f2c1757455c76f +size 51443 diff --git a/4b284b17bc4seed2/transformers/config.json b/4b284b17bc4seed2/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b17bc4seed2/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b17bc4seed2/transformers/pytorch_model.bin b/4b284b17bc4seed2/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..49ecce4b463caa1ad88d9d50613e33b8bfd48a54 --- /dev/null +++ b/4b284b17bc4seed2/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3452e411f237429e2d4e4fba0064008cd6fa3d1fa85a5444baa878413928eb74 +size 8781203669 diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3ca5097eb28db369ae1a1b19a263e76ffc17de2e --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.35083434984315776, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02616449883888229}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07739855446963606, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018358644772690127}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3134763302724362, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0046471347446950095}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11399015240080852, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020851248767886823}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.035905098524200436, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010607078653530643}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1502077023294116, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031613346908548603}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05371017651870693, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013244390739921147}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07417060220648813, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001718378357658079}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3043598891090655, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004514547231263379}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10951433816263247, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019234834216121733}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07397072360499893, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017528966784256012}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2998529800959189, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0043877961837816195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10883876337087849, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019507314452992279}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1615a488f5d3698fba9440e921c654240f538229 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.46876992029559844, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.034927353982595874}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07681384925166049, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001374027323811084}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38097873313953917, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005175759754667372}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1197542888300053, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018385684763670012}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03597310440100041, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008608280387754568}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18829701668248153, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003660067106053917}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05621234382196869, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011822787234320867}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07261876136034388, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012349384043881318}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36150967948798507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00480448094073723}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11342676377933986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016697193247628803}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07302445423139715, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012977773718425825}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.360730723283117, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004772097268097439}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11374416895467514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017281592881802442}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e95510b314046da1e73059ebe3dc8c681c08b336 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5429004464487086, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02956763370387551}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0790589967959102, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001308044694189035}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39953213743199456, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005143398378070516}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12429985090438969, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017944563129484615}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03649208989958607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007894532891278444}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1981597561400995, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036947852288992844}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.057717005144251245, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001119756685357567}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07381899642907389, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001163187972748472}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3733176474539905, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004645414027325048}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1161186279960515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015898207130317827}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07514756287869911, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012323384961919867}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3793258439410288, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004760005880194504}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1181098473843461, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016780964349225184}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..31512d8383e9fe2001cb19a5fdcd9e87bd6c69aa --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5793653489517963, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02573935152338816}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0784768409711552, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013293315467480962}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4021503169264519, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005139543525197391}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12359857437122666, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001817787926962779}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03647411331053875, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007983316045680896}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20161790593954293, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037138076808761883}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05779858759830239, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001133882284527704}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07257219968651211, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011559052093837042}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37199637183821616, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004566562333186737}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11438451893922211, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015822566905128663}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07439716631350449, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012402975601483565}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.38041380356497384, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004723327182697422}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11713401901641247, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016897910257232043}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d9bb95e01fddb484a12e05bef0fa42661d77af2c --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6580262070232321, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04463702693525373}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07997151746529566, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013223612060855499}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4160976831278536, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005209059570687941}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12642774404491391, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001811209169725992}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03735306573238954, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008065591123120885}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21078514701000953, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003845945929146538}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05943674402822863, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001148742985890239}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07356263456582715, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011493251347300905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.38274283663424974, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004614058978267195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11634952210670316, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001574306459194498}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07569528441100878, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012352346049956824}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3931764824594323, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00481151360289427}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11962749419116965, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016873346260864468}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7d91c14483e9b18ac6121089d0351813593d6c8f --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6759695430973514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03994146869595565}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07937597458710605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001230884280609434}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4260002708285773, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0052002522148162}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12621183354053545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001677270665840144}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03663978847219582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007646406840406626}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21523323275826314, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003935924995816928}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05866875700675121, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010853175869745342}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07267084773310319, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010964268932708815}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.38847122796901407, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004554143622718207}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11543687803885108, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014830311221567065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07511819509688057, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011627524680168457}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.40224257158609245, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004821166920297295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11934454714588003, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015725681535582816}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6c242287781f1663bb331c57020dccfe37d197f3 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1462918858923527, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018287969954442684}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2450504599773562, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002667661163946354}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17041087012324713, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018311684543931474}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03005947880661307, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000749689945277961}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05347020409310686, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014364834441163317}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.035613930630312256, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008591133723511533}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11532653680505218, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001297865996200157}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20027220225980916, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002181258587442611}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13592634771209514, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001325717122146055}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13318256778490317, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016411379474036579}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2245030731427097, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002442243276829025}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15540170480114518, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016434471793746518}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.510865468208299, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06679702254496858}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0847cdfa7bc2beba45cecc4ccb940632940968 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2084513743720111, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027615910004934545}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.29432626621828806, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028490942955253194}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21324165401751896, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001944169660478559}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.054478136936203736, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015417128687396466}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07498210243955587, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001693754544827238}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05258866077101279, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001046652141356547}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.15117682215157882, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021453657954331753}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21535233109008273, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022267862814059763}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15295761707945213, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013211828510905123}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.19591291904991898, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0026104979706091298}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.277383576162133, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027253966450803695}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20046236036398457, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018314059922198284}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.6743414261232488, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06424341960347561}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ad27e347cd88135118983d023c3837e91cde1344 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.24780130748953536, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003350152538855383}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2849228433460083, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002870766788486399}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22139199215272853, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001986734930287734}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.07110155096827897, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001996847414860468}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07685904521692397, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017134959757600693}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05892704283287862, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001176092545801061}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1859776104589076, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028381550119400733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.210091559089222, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022706467792696946}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1619118803562238, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014796761111034566}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.23444040733713364, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032065201609602226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.26987412705763364, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027419156490799167}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20929724279019218, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018767292788178292}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.279744668462573, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.057469032972381}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..766efddeb2eb2bcee4f7c4c714f01d547283a23d --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.22785972778596442, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004047623768336541}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.21841898213728125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032170855228152097}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17987775685234184, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024026596328742267}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.07010270751445905, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002318540682504887}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05934134693437993, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016259409779823828}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04933111713020948, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012354318096556433}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.17649205283299266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0034189641055349324}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16398006288219888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025163218326892263}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13510911889705154, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018509997343202566}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.2160404468571716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0038694496855073376}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.20683146627158472, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030707094240185057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17018802287926738, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00227932442052096}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.235109631432272, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10203278334805489}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..be9c48fe3a9d8ec7115f705aa5464602ebd557c3 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.07304913048414251, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030204336205108873}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.06870413101811737, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025879161404963476}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05616898815912234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020232005142444298}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.022008239832194007, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014678784297010139}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.018445977428777703, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001048282411460379}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.015260812067633033, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008189899379778057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.058029662196145824, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025327184849280376}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.052447770497791445, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020100089557701616}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04302893844978566, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001564276452602402}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.06934359312412178, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028948978002469477}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06475119031792104, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024457820594378753}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.052971475992559754, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019124004314651506}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.26810587841047784, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029950151038403774}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e78cd0898080814d849c8e5ef1d75cd28bc503c4 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.01198445818204596, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014260788140505474}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.010220610766916988, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011465740207896803}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008620298324813997, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009283548591333689}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.00408044847073565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007407839704099361}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.003077457407067753, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005389627603175338}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002485343690964915, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0003747637651216558}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.009400832279577742, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011748774477986382}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.007826979829064936, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009041083010678055}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006554043722632426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0007119999952117876}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.011417170592795792, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013642462305233519}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.00976396141526068, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011015780657958785}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008184567229279877, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008812784075419971}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 7.573420248556077e-11, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 3.1437041207051356e-10}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..97a58f048208b14c9a3065a937481dcace111776 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 2.037861086381951, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06836047096040862}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.1257432375112681, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019159382560102038}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.18063486945317253, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00237711509484684}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.13477982203492664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001743490061632216}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.021878282176526525, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006777122817529385}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.03895620866139208, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011682030964887294}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.02690877220249482, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008161465615669739}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.11986562004623494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017379166153133343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.17461605599457494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022693138087502593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.12945758884888567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016292910939932166}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.1053735479207649, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015856551771955404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.1530814011742357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002123300695392577}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.11347069755170848, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015137881232935772}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ca94836a05163f15982da32f57ccf1c3cdb75d7a --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.764768704569181, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11681011094568629}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.31288412867432036, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035427909765099854}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.46936417321714036, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028961231817524477}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.34038061566747974, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023257186137300534}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.1402117253234874, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002153077295713064}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20877767235277261, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002142247790344424}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1500686594700432, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001624535849202585}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.24396944589446695, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002544747084872626}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.38145120151022727, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024982824573944146}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.270217585005139, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016332773734661712}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.25613086398314344, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030892300737176545}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3831682600714934, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002726196482860545}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2779884368567486, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002138192348787855}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9f97659791280bf361409dbabee4b13c2a6f1e75 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.41120500785277, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14503692197542128}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.41684922394706986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004186636542218429}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47779930312968993, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028899949460044045}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3989569396544033, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025486055461129416}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.20453973220943553, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027765650184713338}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2297748462000836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002235777047460442}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19154505382701745, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019212848306377737}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3203365038250148, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003202350372194666}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3812154925631381, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026289202235792435}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31054143071897045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019208559690267063}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3478170949549396, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0037552677433117946}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39699062748706954, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027457154909683134}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3319800958678753, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002409947458257648}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..191a9fc43f36d90debc5f1af9eb25ae05d67c227 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.880715664128529, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17158352471095784}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4639629612713196, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004177611070896573}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4774455798370461, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029485663296399648}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.424927708341804, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025316898411008866}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.23283278901527085, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029068453764692073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23530804144636133, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00230529910790627}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20921887509480042, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020302548686997627}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.35446342612247117, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0033292098685381503}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.37515672755026724, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002701550823819691}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.32731782950290034, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020370117438449557}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3894760454739483, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0037912675869163966}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39999394338789307, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028149429254385665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35633891933244893, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002452743956634602}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f425b94137b71a7baa3d79dbaa539fcb14362be3 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.706440636800545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.209905487839619}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5098369690867808, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004002567289168493}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4723686279223778, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002886704619921623}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4506034619224452, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025013758070757588}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.25914289224620896, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0029364230874773197}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23707814882449188, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022913285376164904}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22552802817973577, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020926553285697054}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3865808291729437, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003296291222009853}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36535480455171704, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026413691146494386}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3432838504924204, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021170609002549544}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.42950005005772757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00369894339951879}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39785576817631046, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002801132216535177}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3795767724760768, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024790158537510575}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7e125348737e0bd57e5e31edc96d42f592208bab --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.560518703918667, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.20359597948392913}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5478048955589382, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003646304257589862}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.46181634864873156, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002829449684475299}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4693805908253228, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023837935475695773}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2806797947585629, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028771642725867316}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23273905795838107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022410883801735454}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2367249143217987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021028372451803615}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4171901160890622, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0031916851104158536}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3533010090596969, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002512590327449297}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3569962031193146, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021217235757559627}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4657607430277977, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00347449889738119}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39171419601830804, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027144503350478343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3986616442882083, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002397258349962964}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1f4ceac02685a0567f0221032b9df55db1ae0400 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16555663520960512, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002350916031037813}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33846924006740337, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004512241619274093}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.21252127035016277, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025864115571601924}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.036682960873275404, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012746186022009752}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0813578209176073, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002823258937880512}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04864427069781243, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016345379475366602}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12383102079115851, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017944359589684203}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25531990108420605, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035961879286077994}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1593146627791285, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002005273521359136}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12887982173138354, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018617251408736065}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2668104550207674, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003882126750149176}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16625220970284751, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021526107283535763}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.1659375451775023, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08796273062555653}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fbd8e5a7fcb3a64967ecdf5ee0de82add1a439bd --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12191668255144995, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018744055949995327}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2959860856721735, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004221609430843479}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1704938656510208, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025041299403158915}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.024164572329844397, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009916021177288831}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.060891416073132976, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025613288257139185}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03416710366435938, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013987962350626175}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0975659267221333, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001440048531173298}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2392357548644633, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003456319267315421}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13677834118995133, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019516199956448555}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09535036073703265, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014913950729399169}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23379176392496767, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003558139035756323}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13373022588407824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002029628375959834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.372878124069159, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10628208436225739}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a90f705174b1fafd277f0889dbd41a3554d2478f --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12401282957751562, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018086229990670103}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3006971019571205, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0041945785600752275}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17346901294999267, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024344080720837187}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026603501521828835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010223229811750628}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0675828081201739, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002731130284560611}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03768828213738444, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014534893459285194}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10355973612883328, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001465106697617734}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25260278092232574, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003565272166106387}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14506956673567722, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001994098811993386}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09503425023185773, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014299553564488096}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2329664126562576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035173823491549657}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13331847036755312, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001956347470169085}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4427786967748797, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07197072253354266}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e329e877d03d6b022042861d0d7f2cfb15735d5e --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12214204871382313, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002084100128771504}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28246965413896563, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004324995737850001}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16632335865304773, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025299739381817593}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02614942974783642, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010763157543408628}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06368541200359151, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026337661338491167}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.036241177362694006, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014557689358685685}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10305700097987354, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017645313615610096}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23979879495225828, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003771353003528918}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14060277612451139, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021501487866175113}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09483807961662477, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017236941779501837}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22094049122854434, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003657852505661345}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1292272723627335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020721194526319656}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5156237113434763, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0631936029065487}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..360ddea592dfdf1106451e4cd83d52034d782e51 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0432285843007251, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028300766953997187}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07395689554615742, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004188070182507775}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04858663386480001, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0027437547624381}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01020426047640163, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015103464507138337}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.016580756477888384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015144724892508722}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.010675959199877173, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010064041044064703}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03572253309181341, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0024090282901972097}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.06108738968000979, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034621309760131344}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03983479899100355, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022280404596322053}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.034619579364571246, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002407661648926437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05848663354465383, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0033818382426695753}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03823641847129987, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002188114108570348}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.750204076090565, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09885266245065417}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0beded207b7d36b1b1e276d848f9def03241fecc --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/agg.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0031617466950151526, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009422468564219445}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0023901568791608856, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0006627590193091817}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002642223927312502, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007481596232712278}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00043638381596206233, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002341700780478905}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0002613738462795066, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00013420744260873104}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00032443951826456114, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0001690966109579966}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0024195201987089257, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000713709556932369}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0018124786385441715, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004928032488930425}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0020200852307165357, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005643437419794288}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0026721155192842684, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008074535350699844}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.002049243066915627, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0005753193200840467}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0022474009830527964, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006426778263930278}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.959836607955245e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.7361993680103838e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..c661a1b65c47fbc68977962c16e1a9c763318349 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382b023958834de403446ada28a44fcbfeb8e89abd7de93ffa4cd21ae40dc1a1 +size 4103646 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..011efcab6f291c98befa7d598f14f36c416fa53c 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6f4efb1e3788f0925fc63ec8b0cd13740ff753999ffd8cd6c27c8a992620b2 +size 5076782 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..15a9e73055608e96a531cb0bb25bde279a7841aa 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f06dc6d9f48e22bd81fcf08df526ad1a645bd1e0f8a545e187cf034f9d6aa4 +size 5973359 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..0754f1221666c7fb1810d60ab64db63d43537ab1 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32185333f9a12c8e2b76d68b78895ac6840eda2f8c594729e16efd22de94609 +size 6887153 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..f5b566539ec710c51bab0490ee9453255b3d1115 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b49a715c28cda2d018d620f157e40a438231e21979884da20aa309f6299120 +size 7795100 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..9ce62c4baea5c1e5ee0e673a787b070d44f64c3d 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f52e6e05281897f1543576a06186c77eb2968adf16d1560a55d5a389ccb047a +size 8712457 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..9e35d893f0bef4cf43156904ef6c633a135bf5bf 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11e94f17d42e9ca8328fa42c35219d8dc738c22e55d0c85681fdf0ad0dd9c25 +size 7677652 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..db7dca1fa52bd33d46277bebb7a48fc958e06c85 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:393c04b6d8885684fb5a9e20a748c75a9328dff9b9f2215d62f277765b00cf1c +size 13260268 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..f605b4e54f20974fcda3e6434e598edfb22b3894 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd663c3334e4037668389dbf6436cbf8c99afc1720a23fc7e4c74c6a9f28c43d +size 18784885 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..30c52b44e2217ee8773155e84da26ece65f6c3d8 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c95feb90ab75302b39b8c4d4139ec1aaa98da15891bd2528cdd0db0f61fb6fc +size 24166503 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..5e1567f8fa4245b25ddbeebe2391eee7a2b9f205 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d36f371185cc312c3a29b6a1e09550f282b6105adaf6b64adf17f5451cdc8a5 +size 29409787 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..bd65f59002feacc721622de1cf986eabda2b28fd 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c344afe40a3efadd936b7869f274838911e0ece0c66b141e1bed619167449d +size 34786974 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..f5aa018fe9be9acada64a6897b1e5b48ce39c452 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83143ed203128ac8e3cbd0d3e48d115ad38e70fb185f2a39cb430acaa4cdd352 +size 4241314 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..dd94bf307816d854dc26622d09ed7b36c393204f 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0929253ca59a06989483170729a6e5b1d9cb5c8ef3712b610a173b218271bafd +size 5436420 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..37b4c3957588c3247f2aea2598697d3143069996 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eafc9aababfa38020ea6d0af1e1e3a70d46a52736bab43467f6dfecec01963 +size 6370742 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..c94e2de46fbc96f5d992900a7116fee07112c37e 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d28b294290f1893f991311deb02aa354852ff105f997971b4c89f38b2baacc0c +size 7381580 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..eb9f30b2ebe4321f30de15def41ccacde217738b 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d10b5060ba90ab79870a9b466ba419241947ee15145ab6a88d7727044bc2404 +size 8387586 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..443daefe37424843c70d1bc74de3d0a8f1a99830 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65dcd296b4eb22d9a4c395e1678b05447f065eac81910f39d045092be44458f7 +size 9406652 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..76310d593de977cc68e8c5cfe4ce1301850d4c4c 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ed3eb921002b2a8fcbfd898261e2961eec6ba107e22bf3310665e677aa18359 +size 2797630 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..d8d831d2854648362df808748b5cef0822d78a45 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b4c708f042f3bb11d4282277cbd2e993392fec07ff21fbe0d481847b344760 +size 5104435 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..06d5d493608251cfe7d0f10e418acd15527d124b 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f0ff47b44482f45d7b3288b2994974e1f7d5c2f0e10954000b2e6ab9ea1d94 +size 7378270 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..f467665ece687043ed6bdd705db46fcb802c4ef3 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db3ddb17eb0ad43d667ec5814da1d71fbf8ddda241f4e1585ad592ba270676be +size 9645409 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..afa60ffc06f06a63c9d4724294d6a0900c943539 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e857506f330e11d884209415a8e2e9998480f505fbd1331519a9f6b8b527c5 +size 11671724 diff --git a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.jsonl b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.jsonl index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..da01060568e8ad83f8b10992bf391b2e41bf3aa1 100644 --- a/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.jsonl +++ b/4b284b42bc4seed1/evaluation/generation/examples.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e24a15ebc0040a94645a61c4f18e47da3085946b87373345b62601dcab5749 +size 13897442 diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ed4a5888033b6d0e3b22287e2d937809cedef3ba --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.35083434984315776, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02616449883888229 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07739855446963606, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018358644772690127 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3134763302724362, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0046471347446950095 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11399015240080852, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020851248767886823 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.035905098524200436, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010607078653530643 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1502077023294116, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031613346908548603 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05371017651870693, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013244390739921147 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07417060220648813, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001718378357658079 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3043598891090655, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004514547231263379 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10951433816263247, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019234834216121733 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07397072360499893, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017528966784256012 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2998529800959189, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0043877961837816195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10883876337087849, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019507314452992279 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7ac8da59465ee13a27c5008d5ca2e70689b77493 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.46876992029559844, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.034927353982595874 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07681384925166049, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001374027323811084 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38097873313953917, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005175759754667372 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1197542888300053, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018385684763670012 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03597310440100041, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008608280387754568 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18829701668248153, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003660067106053917 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05621234382196869, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011822787234320867 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07261876136034388, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012349384043881318 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36150967948798507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00480448094073723 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11342676377933986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016697193247628803 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07302445423139715, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012977773718425825 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.360730723283117, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004772097268097439 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11374416895467514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017281592881802442 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..cb12d7262a72132a018275039154a04cfb3be609 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5429004464487086, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02956763370387551 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0790589967959102, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001308044694189035 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39953213743199456, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005143398378070516 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12429985090438969, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017944563129484615 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03649208989958607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007894532891278444 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1981597561400995, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036947852288992844 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.057717005144251245, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001119756685357567 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07381899642907389, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001163187972748472 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3733176474539905, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004645414027325048 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1161186279960515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015898207130317827 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07514756287869911, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012323384961919867 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3793258439410288, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004760005880194504 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1181098473843461, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016780964349225184 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5c2fd7d7612ca93476d7a0d81b22acb49ff026e8 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5793653489517963, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02573935152338816 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0784768409711552, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013293315467480962 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4021503169264519, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005139543525197391 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12359857437122666, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001817787926962779 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03647411331053875, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007983316045680896 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20161790593954293, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037138076808761883 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05779858759830239, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001133882284527704 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07257219968651211, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011559052093837042 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37199637183821616, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004566562333186737 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11438451893922211, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015822566905128663 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07439716631350449, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012402975601483565 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.38041380356497384, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004723327182697422 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11713401901641247, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016897910257232043 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..783cbcdde320c345e29527d8aea9f032466edea8 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6580262070232321, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04463702693525373 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07997151746529566, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013223612060855499 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4160976831278536, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005209059570687941 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12642774404491391, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001811209169725992 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03735306573238954, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008065591123120885 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21078514701000953, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003845945929146538 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05943674402822863, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001148742985890239 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07356263456582715, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011493251347300905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.38274283663424974, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004614058978267195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11634952210670316, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001574306459194498 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07569528441100878, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012352346049956824 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3931764824594323, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00481151360289427 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11962749419116965, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016873346260864468 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e71936c77bbbc80834605761845f301334f0e0df --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6759695430973514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03994146869595565 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07937597458710605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001230884280609434 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4260002708285773, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0052002522148162 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12621183354053545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001677270665840144 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03663978847219582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007646406840406626 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21523323275826314, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003935924995816928 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05866875700675121, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010853175869745342 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07267084773310319, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010964268932708815 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.38847122796901407, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004554143622718207 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11543687803885108, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014830311221567065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07511819509688057, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011627524680168457 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.40224257158609245, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004821166920297295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11934454714588003, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015725681535582816 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4ed13130c2ebe88b1a5414692c62d2fceb7f2ccf --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1462918858923527, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018287969954442684 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2450504599773562, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002667661163946354 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17041087012324713, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018311684543931474 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03005947880661307, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000749689945277961 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05347020409310686, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014364834441163317 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.035613930630312256, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008591133723511533 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11532653680505218, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001297865996200157 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20027220225980916, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002181258587442611 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13592634771209514, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001325717122146055 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13318256778490317, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016411379474036579 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2245030731427097, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002442243276829025 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15540170480114518, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016434471793746518 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.510865468208299, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06679702254496858 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3623cb597d56416f63aef98448300ea4a9fc9ba6 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2084513743720111, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0027615910004934545 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.29432626621828806, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028490942955253194 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21324165401751896, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001944169660478559 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.054478136936203736, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015417128687396466 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07498210243955587, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001693754544827238 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05258866077101279, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001046652141356547 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.15117682215157882, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0021453657954331753 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21535233109008273, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022267862814059763 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15295761707945213, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013211828510905123 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.19591291904991898, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0026104979706091298 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.277383576162133, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027253966450803695 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20046236036398457, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018314059922198284 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.6743414261232488, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06424341960347561 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ad8019a487a775280ca872da9fbbb16d810d410e --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.24780130748953536, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003350152538855383 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2849228433460083, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002870766788486399 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22139199215272853, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001986734930287734 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.07110155096827897, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001996847414860468 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07685904521692397, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017134959757600693 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05892704283287862, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001176092545801061 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1859776104589076, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0028381550119400733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.210091559089222, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022706467792696946 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1619118803562238, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014796761111034566 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.23444040733713364, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0032065201609602226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.26987412705763364, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027419156490799167 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20929724279019218, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018767292788178292 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.279744668462573, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.057469032972381 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7e90894e678dd8c189f122cde60f914334c14f2f --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.22785972778596442, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004047623768336541 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.21841898213728125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032170855228152097 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17987775685234184, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0024026596328742267 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.07010270751445905, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002318540682504887 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05934134693437993, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016259409779823828 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04933111713020948, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012354318096556433 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.17649205283299266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0034189641055349324 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16398006288219888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025163218326892263 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13510911889705154, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018509997343202566 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.2160404468571716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0038694496855073376 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.20683146627158472, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030707094240185057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17018802287926738, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00227932442052096 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.235109631432272, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10203278334805489 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1be927437908515c8196a96758232ad39354fd16 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.07304913048414251, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0030204336205108873 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.06870413101811737, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025879161404963476 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05616898815912234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020232005142444298 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.022008239832194007, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0014678784297010139 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.018445977428777703, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001048282411460379 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.015260812067633033, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008189899379778057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.058029662196145824, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0025327184849280376 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.052447770497791445, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020100089557701616 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04302893844978566, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001564276452602402 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.06934359312412178, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0028948978002469477 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06475119031792104, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024457820594378753 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.052971475992559754, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019124004314651506 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.26810587841047784, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029950151038403774 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0781b56bdbead08c019e4d781ab54089572884fc --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.01198445818204596, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014260788140505474 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.010220610766916988, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011465740207896803 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008620298324813997, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0009283548591333689 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.00408044847073565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007407839704099361 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.003077457407067753, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0005389627603175338 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002485343690964915, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0003747637651216558 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.009400832279577742, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011748774477986382 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.007826979829064936, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009041083010678055 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006554043722632426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0007119999952117876 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.011417170592795792, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013642462305233519 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.00976396141526068, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0011015780657958785 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008184567229279877, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008812784075419971 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 7.573420248556077e-11, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 3.1437041207051356e-10 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c6c8c18a7fae2ead847572c9dc364aabf2675e83 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 2.037861086381951, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.06836047096040862 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.1257432375112681, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0019159382560102038 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.18063486945317253, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.00237711509484684 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.13477982203492664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001743490061632216 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.021878282176526525, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0006777122817529385 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.03895620866139208, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0011682030964887294 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.02690877220249482, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0008161465615669739 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.11986562004623494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0017379166153133343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.17461605599457494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022693138087502593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.12945758884888567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016292910939932166 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.1053735479207649, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0015856551771955404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.1530814011742357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002123300695392577 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.11347069755170848, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015137881232935772 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf78d0bbe4b340b96a47262c067a0db0309b1d8 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.764768704569181, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11681011094568629 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.31288412867432036, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0035427909765099854 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.46936417321714036, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028961231817524477 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.34038061566747974, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023257186137300534 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.1402117253234874, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002153077295713064 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20877767235277261, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002142247790344424 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1500686594700432, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001624535849202585 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.24396944589446695, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002544747084872626 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.38145120151022727, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024982824573944146 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.270217585005139, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016332773734661712 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.25613086398314344, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030892300737176545 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3831682600714934, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002726196482860545 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2779884368567486, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002138192348787855 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..129b2ae46f706519f2eb4eca3cedc73d99c4954e --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.41120500785277, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14503692197542128 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.41684922394706986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004186636542218429 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47779930312968993, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028899949460044045 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3989569396544033, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0025486055461129416 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.20453973220943553, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027765650184713338 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2297748462000836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002235777047460442 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19154505382701745, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019212848306377737 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3203365038250148, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003202350372194666 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3812154925631381, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0026289202235792435 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31054143071897045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019208559690267063 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3478170949549396, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0037552677433117946 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39699062748706954, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027457154909683134 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3319800958678753, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002409947458257648 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..07342ddfd05f0b2c55efc611c3327c2727d5cbd7 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.880715664128529, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17158352471095784 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4639629612713196, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004177611070896573 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4774455798370461, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029485663296399648 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.424927708341804, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0025316898411008866 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.23283278901527085, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0029068453764692073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23530804144636133, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00230529910790627 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20921887509480042, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020302548686997627 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.35446342612247117, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0033292098685381503 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.37515672755026724, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002701550823819691 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.32731782950290034, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020370117438449557 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3894760454739483, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0037912675869163966 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39999394338789307, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028149429254385665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35633891933244893, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002452743956634602 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..28d51f367c198a7c04556eebd7864ded143b4afd --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.706440636800545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.209905487839619 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5098369690867808, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004002567289168493 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4723686279223778, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002886704619921623 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4506034619224452, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0025013758070757588 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.25914289224620896, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0029364230874773197 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23707814882449188, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022913285376164904 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22552802817973577, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020926553285697054 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3865808291729437, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003296291222009853 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36535480455171704, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0026413691146494386 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3432838504924204, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021170609002549544 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.42950005005772757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00369894339951879 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39785576817631046, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002801132216535177 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3795767724760768, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024790158537510575 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c3417a2e9995184dcb1648f264e8894fef3ec99d --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.560518703918667, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.20359597948392913 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5478048955589382, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003646304257589862 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.46181634864873156, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002829449684475299 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4693805908253228, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023837935475695773 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2806797947585629, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028771642725867316 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23273905795838107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022410883801735454 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2367249143217987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021028372451803615 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4171901160890622, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0031916851104158536 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3533010090596969, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002512590327449297 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3569962031193146, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021217235757559627 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4657607430277977, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00347449889738119 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39171419601830804, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027144503350478343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3986616442882083, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002397258349962964 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..26ac40f8bb0d004354be85e463ea324178c29664 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16555663520960512, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002350916031037813 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33846924006740337, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004512241619274093 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.21252127035016277, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025864115571601924 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.036682960873275404, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0012746186022009752 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0813578209176073, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002823258937880512 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04864427069781243, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016345379475366602 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12383102079115851, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017944359589684203 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25531990108420605, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035961879286077994 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1593146627791285, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002005273521359136 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12887982173138354, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018617251408736065 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2668104550207674, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003882126750149176 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16625220970284751, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021526107283535763 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.1659375451775023, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08796273062555653 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebaa9b7ad3f55f93b8afab4b87fb25c9e1f9e45 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12191668255144995, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018744055949995327 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2959860856721735, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004221609430843479 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1704938656510208, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025041299403158915 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.024164572329844397, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009916021177288831 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.060891416073132976, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025613288257139185 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03416710366435938, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013987962350626175 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0975659267221333, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001440048531173298 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2392357548644633, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003456319267315421 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13677834118995133, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019516199956448555 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09535036073703265, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014913950729399169 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23379176392496767, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003558139035756323 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13373022588407824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002029628375959834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.372878124069159, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10628208436225739 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3d0596bed790e7dd9b300019c1db1ff8c5054025 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12401282957751562, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018086229990670103 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3006971019571205, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0041945785600752275 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17346901294999267, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024344080720837187 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026603501521828835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010223229811750628 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0675828081201739, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002731130284560611 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03768828213738444, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014534893459285194 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10355973612883328, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001465106697617734 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25260278092232574, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003565272166106387 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14506956673567722, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001994098811993386 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09503425023185773, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014299553564488096 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2329664126562576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035173823491549657 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13331847036755312, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001956347470169085 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4427786967748797, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07197072253354266 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5dfb75729fd63abe590241dbf6fcfd0d0ff0164b --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12214204871382313, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002084100128771504 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28246965413896563, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004324995737850001 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16632335865304773, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025299739381817593 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02614942974783642, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010763157543408628 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06368541200359151, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026337661338491167 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.036241177362694006, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014557689358685685 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10305700097987354, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017645313615610096 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23979879495225828, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003771353003528918 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14060277612451139, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021501487866175113 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09483807961662477, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0017236941779501837 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22094049122854434, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003657852505661345 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1292272723627335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020721194526319656 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5156237113434763, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0631936029065487 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..fbd1ceb72e3121dcb9efc2f6afcf3e1c6171743b --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0432285843007251, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0028300766953997187 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07395689554615742, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004188070182507775 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04858663386480001, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0027437547624381 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01020426047640163, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0015103464507138337 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.016580756477888384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015144724892508722 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.010675959199877173, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010064041044064703 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03572253309181341, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0024090282901972097 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.06108738968000979, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034621309760131344 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03983479899100355, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0022280404596322053 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.034619579364571246, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002407661648926437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05848663354465383, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0033818382426695753 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03823641847129987, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002188114108570348 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.750204076090565, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09885266245065417 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..64d97074d6e3f8e91ccbb4c9821166804ffff8f4 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/generation/slim.4b284b42bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0031617466950151526, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0009422468564219445 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0023901568791608856, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0006627590193091817 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002642223927312502, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0007481596232712278 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00043638381596206233, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0002341700780478905 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0002613738462795066, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00013420744260873104 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00032443951826456114, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0001690966109579966 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0024195201987089257, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.000713709556932369 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0018124786385441715, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004928032488930425 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0020200852307165357, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005643437419794288 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0026721155192842684, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008074535350699844 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.002049243066915627, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0005753193200840467 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0022474009830527964, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0006426778263930278 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.959836607955245e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.7361993680103838e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b42bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_0.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9476da3d1b11a47cbd576c8c5a6e94abf5a58e76 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402702 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.013570806258433625 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909282 + }, + "hellaswag": { + "acc": 0.47998406691894047, + "acc_stderr": 0.004985781620467009, + "acc_norm": 0.6341366261700856, + "acc_norm_stderr": 0.004806870285747303 + }, + "rte": { + "acc": 0.516245487364621, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5730071033938438, + "acc_stderr": 0.013901878072575055 + }, + "storycloze_2016": { + "acc": 0.7161945483698557, + "acc_stderr": 0.010425696279730926 + }, + "boolq": { + "acc": 0.5871559633027523, + "acc_stderr": 0.00861117243047287 + }, + "arc_easy": { + "acc": 0.6102693602693603, + "acc_stderr": 0.010007169391797051, + "acc_norm": 0.5260942760942761, + "acc_norm_stderr": 0.01024580199024005 + }, + "arc_challenge": { + "acc": 0.2696245733788396, + "acc_stderr": 0.012968040686869147, + "acc_norm": 0.295221843003413, + "acc_norm_stderr": 0.013329750293382316 + }, + "sciq": { + "acc": 0.852, + "acc_stderr": 0.01123486636423524, + "acc_norm": 0.764, + "acc_norm_stderr": 0.013434451402438676 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568793, + "acc_norm": 0.7627856365614799, + "acc_norm_stderr": 0.009924694933586367 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_0_lm-eval_global_step80108_2023-02-26-01-49-43_0shots_backup.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_0_lm-eval_global_step80108_2023-02-26-01-49-43_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..9476da3d1b11a47cbd576c8c5a6e94abf5a58e76 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_0_lm-eval_global_step80108_2023-02-26-01-49-43_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402702 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.013570806258433625 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909282 + }, + "hellaswag": { + "acc": 0.47998406691894047, + "acc_stderr": 0.004985781620467009, + "acc_norm": 0.6341366261700856, + "acc_norm_stderr": 0.004806870285747303 + }, + "rte": { + "acc": 0.516245487364621, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5730071033938438, + "acc_stderr": 0.013901878072575055 + }, + "storycloze_2016": { + "acc": 0.7161945483698557, + "acc_stderr": 0.010425696279730926 + }, + "boolq": { + "acc": 0.5871559633027523, + "acc_stderr": 0.00861117243047287 + }, + "arc_easy": { + "acc": 0.6102693602693603, + "acc_stderr": 0.010007169391797051, + "acc_norm": 0.5260942760942761, + "acc_norm_stderr": 0.01024580199024005 + }, + "arc_challenge": { + "acc": 0.2696245733788396, + "acc_stderr": 0.012968040686869147, + "acc_norm": 0.295221843003413, + "acc_norm_stderr": 0.013329750293382316 + }, + "sciq": { + "acc": 0.852, + "acc_stderr": 0.01123486636423524, + "acc_norm": 0.764, + "acc_norm_stderr": 0.013434451402438676 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568793, + "acc_norm": 0.7627856365614799, + "acc_norm_stderr": 0.009924694933586367 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_1.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_1.json new file mode 100644 index 0000000000000000000000000000000000000000..85fbcad10703f141d67b10fe2a1e733805c364a7 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.014746404865473486 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874087 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.3489401351036571 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4761999601672974, + "acc_stderr": 0.004984125363319069, + "acc_norm": 0.632742481577375, + "acc_norm_stderr": 0.004810723108378211 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5919494869771112, + "acc_stderr": 0.013812822643745028 + }, + "storycloze_2016": { + "acc": 0.7071084981293426, + "acc_stderr": 0.010523873293246309 + }, + "boolq": { + "acc": 0.6103975535168196, + "acc_stderr": 0.008529228894936292 + }, + "arc_easy": { + "acc": 0.6144781144781145, + "acc_stderr": 0.009987250004629022, + "acc_norm": 0.5761784511784511, + "acc_norm_stderr": 0.010140006095213606 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252425, + "acc_norm": 0.3054607508532423, + "acc_norm_stderr": 0.013460080478002501 + }, + "sciq": { + "acc": 0.89, + "acc_stderr": 0.00989939381972444, + "acc_norm": 0.861, + "acc_norm_stderr": 0.01094526376104297 + }, + "piqa": { + "acc": 0.7470076169749728, + "acc_stderr": 0.01014288869886246, + "acc_norm": 0.750816104461371, + "acc_norm_stderr": 0.01009188277012021 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_1_lm-eval_global_step80108_2023-02-26-01-49-43_1shots_backup.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_1_lm-eval_global_step80108_2023-02-26-01-49-43_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..85fbcad10703f141d67b10fe2a1e733805c364a7 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_1_lm-eval_global_step80108_2023-02-26-01-49-43_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.014746404865473486 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874087 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.3489401351036571 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4761999601672974, + "acc_stderr": 0.004984125363319069, + "acc_norm": 0.632742481577375, + "acc_norm_stderr": 0.004810723108378211 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5919494869771112, + "acc_stderr": 0.013812822643745028 + }, + "storycloze_2016": { + "acc": 0.7071084981293426, + "acc_stderr": 0.010523873293246309 + }, + "boolq": { + "acc": 0.6103975535168196, + "acc_stderr": 0.008529228894936292 + }, + "arc_easy": { + "acc": 0.6144781144781145, + "acc_stderr": 0.009987250004629022, + "acc_norm": 0.5761784511784511, + "acc_norm_stderr": 0.010140006095213606 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252425, + "acc_norm": 0.3054607508532423, + "acc_norm_stderr": 0.013460080478002501 + }, + "sciq": { + "acc": 0.89, + "acc_stderr": 0.00989939381972444, + "acc_norm": 0.861, + "acc_norm_stderr": 0.01094526376104297 + }, + "piqa": { + "acc": 0.7470076169749728, + "acc_stderr": 0.01014288869886246, + "acc_norm": 0.750816104461371, + "acc_norm_stderr": 0.01009188277012021 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_2.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1fa6323900287f4a87a0555bb035647d60e501ef --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363935 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055235 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002514 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2854808590102708 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.474407488548098, + "acc_stderr": 0.004983240744101372, + "acc_norm": 0.6302529376618203, + "acc_norm_stderr": 0.004817495546789556 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.0300523034631437 + }, + "winogrande": { + "acc": 0.5714285714285714, + "acc_stderr": 0.013908353814606679 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.6110091743119266, + "acc_stderr": 0.008526800159503209 + }, + "arc_easy": { + "acc": 0.6241582491582491, + "acc_stderr": 0.009938436373170637, + "acc_norm": 0.6031144781144782, + "acc_norm_stderr": 0.010039236800583199 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.013406741767847626, + "acc_norm": 0.32764505119453924, + "acc_norm_stderr": 0.013715847940719344 + }, + "sciq": { + "acc": 0.908, + "acc_stderr": 0.009144376393151115, + "acc_norm": 0.884, + "acc_norm_stderr": 0.01013146813875701 + }, + "piqa": { + "acc": 0.7568008705114254, + "acc_stderr": 0.010009611953858917, + "acc_norm": 0.7562568008705114, + "acc_norm_stderr": 0.010017199471500609 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_2_lm-eval_global_step80108_2023-02-26-01-49-43_2shots_backup.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_2_lm-eval_global_step80108_2023-02-26-01-49-43_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1fa6323900287f4a87a0555bb035647d60e501ef --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_2_lm-eval_global_step80108_2023-02-26-01-49-43_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363935 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055235 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002514 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2854808590102708 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.474407488548098, + "acc_stderr": 0.004983240744101372, + "acc_norm": 0.6302529376618203, + "acc_norm_stderr": 0.004817495546789556 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.0300523034631437 + }, + "winogrande": { + "acc": 0.5714285714285714, + "acc_stderr": 0.013908353814606679 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.6110091743119266, + "acc_stderr": 0.008526800159503209 + }, + "arc_easy": { + "acc": 0.6241582491582491, + "acc_stderr": 0.009938436373170637, + "acc_norm": 0.6031144781144782, + "acc_norm_stderr": 0.010039236800583199 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.013406741767847626, + "acc_norm": 0.32764505119453924, + "acc_norm_stderr": 0.013715847940719344 + }, + "sciq": { + "acc": 0.908, + "acc_stderr": 0.009144376393151115, + "acc_norm": 0.884, + "acc_norm_stderr": 0.01013146813875701 + }, + "piqa": { + "acc": 0.7568008705114254, + "acc_stderr": 0.010009611953858917, + "acc_norm": 0.7562568008705114, + "acc_norm_stderr": 0.010017199471500609 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_3.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_3.json new file mode 100644 index 0000000000000000000000000000000000000000..14301981e5d69ae67b87370e99b17d663e745da6 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077245 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2867458653622175 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.041633319989322626 + }, + "hellaswag": { + "acc": 0.4778928500298745, + "acc_stderr": 0.004984901752846398, + "acc_norm": 0.6357299342760406, + "acc_norm_stderr": 0.004802413919932651 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5808997632202052, + "acc_stderr": 0.013867325192210109 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.6278287461773701, + "acc_stderr": 0.008454434247373898 + }, + "arc_easy": { + "acc": 0.6296296296296297, + "acc_stderr": 0.009908978578665757, + "acc_norm": 0.61489898989899, + "acc_norm_stderr": 0.00998521479873725 + }, + "arc_challenge": { + "acc": 0.3054607508532423, + "acc_stderr": 0.0134600804780025, + "acc_norm": 0.318259385665529, + "acc_norm_stderr": 0.013611993916971453 + }, + "sciq": { + "acc": 0.908, + "acc_stderr": 0.009144376393151098, + "acc_norm": 0.9, + "acc_norm_stderr": 0.009491579957525068 + }, + "piqa": { + "acc": 0.7535364526659413, + "acc_stderr": 0.010054810789671822, + "acc_norm": 0.76550598476605, + "acc_norm_stderr": 0.009885203143240538 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_3_lm-eval_global_step80108_2023-02-26-01-49-43_3shots_backup.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_3_lm-eval_global_step80108_2023-02-26-01-49-43_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..14301981e5d69ae67b87370e99b17d663e745da6 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_3_lm-eval_global_step80108_2023-02-26-01-49-43_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077245 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2867458653622175 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.041633319989322626 + }, + "hellaswag": { + "acc": 0.4778928500298745, + "acc_stderr": 0.004984901752846398, + "acc_norm": 0.6357299342760406, + "acc_norm_stderr": 0.004802413919932651 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5808997632202052, + "acc_stderr": 0.013867325192210109 + }, + "storycloze_2016": { + "acc": 0.721004810261892, + "acc_stderr": 0.010371620932652793 + }, + "boolq": { + "acc": 0.6278287461773701, + "acc_stderr": 0.008454434247373898 + }, + "arc_easy": { + "acc": 0.6296296296296297, + "acc_stderr": 0.009908978578665757, + "acc_norm": 0.61489898989899, + "acc_norm_stderr": 0.00998521479873725 + }, + "arc_challenge": { + "acc": 0.3054607508532423, + "acc_stderr": 0.0134600804780025, + "acc_norm": 0.318259385665529, + "acc_norm_stderr": 0.013611993916971453 + }, + "sciq": { + "acc": 0.908, + "acc_stderr": 0.009144376393151098, + "acc_norm": 0.9, + "acc_norm_stderr": 0.009491579957525068 + }, + "piqa": { + "acc": 0.7535364526659413, + "acc_stderr": 0.010054810789671822, + "acc_norm": 0.76550598476605, + "acc_norm_stderr": 0.009885203143240538 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_4.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_4.json new file mode 100644 index 0000000000000000000000000000000000000000..760c83b8612d4e2b93cc86a65cfa58c747d2ab43 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.365, + "acc_stderr": 0.015231776226264893 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.35333333333333333, + "acc_stderr": 0.013804572162314918 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.27761904761904765 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.041633319989322626 + }, + "hellaswag": { + "acc": 0.4761999601672974, + "acc_stderr": 0.004984125363319068, + "acc_norm": 0.6354311890061741, + "acc_norm_stderr": 0.004803253812881048 + }, + "rte": { + "acc": 0.4404332129963899, + "acc_stderr": 0.029882123363118716 + }, + "winogrande": { + "acc": 0.5872138910812944, + "acc_stderr": 0.013837060648682106 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.01031606278759001 + }, + "boolq": { + "acc": 0.6269113149847095, + "acc_stderr": 0.00845866125205838 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.009894923464455183, + "acc_norm": 0.6182659932659933, + "acc_norm_stderr": 0.009968648851839675 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3302047781569966, + "acc_norm_stderr": 0.013743085603760426 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745918, + "acc_norm": 0.9, + "acc_norm_stderr": 0.00949157995752507 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867483, + "acc_norm": 0.7606093579978237, + "acc_norm_stderr": 0.00995588425029169 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_4_lm-eval_global_step80108_2023-02-26-01-49-43_4shots_backup.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_4_lm-eval_global_step80108_2023-02-26-01-49-43_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..760c83b8612d4e2b93cc86a65cfa58c747d2ab43 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_4_lm-eval_global_step80108_2023-02-26-01-49-43_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.365, + "acc_stderr": 0.015231776226264893 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.35333333333333333, + "acc_stderr": 0.013804572162314918 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.27761904761904765 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.041633319989322626 + }, + "hellaswag": { + "acc": 0.4761999601672974, + "acc_stderr": 0.004984125363319068, + "acc_norm": 0.6354311890061741, + "acc_norm_stderr": 0.004803253812881048 + }, + "rte": { + "acc": 0.4404332129963899, + "acc_stderr": 0.029882123363118716 + }, + "winogrande": { + "acc": 0.5872138910812944, + "acc_stderr": 0.013837060648682106 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.01031606278759001 + }, + "boolq": { + "acc": 0.6269113149847095, + "acc_stderr": 0.00845866125205838 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.009894923464455183, + "acc_norm": 0.6182659932659933, + "acc_norm_stderr": 0.009968648851839675 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3302047781569966, + "acc_norm_stderr": 0.013743085603760426 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745918, + "acc_norm": 0.9, + "acc_norm_stderr": 0.00949157995752507 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867483, + "acc_norm": 0.7606093579978237, + "acc_norm_stderr": 0.00995588425029169 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_5.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6638872f19c23fd7331cf79496b74bd6b75c7dd2 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.359, + "acc_stderr": 0.015177264224798596 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.013789711695404798 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.32688172043010755 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.4774945230033858, + "acc_stderr": 0.004984724235115124, + "acc_norm": 0.6384186417048396, + "acc_norm_stderr": 0.004794764843685285 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5730071033938438, + "acc_stderr": 0.01390187807257506 + }, + "storycloze_2016": { + "acc": 0.7306253340459647, + "acc_stderr": 0.010258997754057014 + }, + "boolq": { + "acc": 0.6223241590214067, + "acc_stderr": 0.008479309208281646 + }, + "arc_easy": { + "acc": 0.6384680134680135, + "acc_stderr": 0.009858506543162063, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493126 + }, + "arc_challenge": { + "acc": 0.2986348122866894, + "acc_stderr": 0.013374078615068754, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946526 + }, + "sciq": { + "acc": 0.912, + "acc_stderr": 0.00896305396259208, + "acc_norm": 0.916, + "acc_norm_stderr": 0.008776162089491122 + }, + "piqa": { + "acc": 0.7431991294885746, + "acc_stderr": 0.01019286480227804, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858914 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_5_lm-eval_global_step80108_2023-02-26-01-49-43_5shots_backup.json b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_5_lm-eval_global_step80108_2023-02-26-01-49-43_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..6638872f19c23fd7331cf79496b74bd6b75c7dd2 --- /dev/null +++ b/4b284b42bc4seed1/evaluation/rankeval/4b284b42bc4seed1_5_lm-eval_global_step80108_2023-02-26-01-49-43_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.359, + "acc_stderr": 0.015177264224798596 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.013789711695404798 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.32688172043010755 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.4774945230033858, + "acc_stderr": 0.004984724235115124, + "acc_norm": 0.6384186417048396, + "acc_norm_stderr": 0.004794764843685285 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5730071033938438, + "acc_stderr": 0.01390187807257506 + }, + "storycloze_2016": { + "acc": 0.7306253340459647, + "acc_stderr": 0.010258997754057014 + }, + "boolq": { + "acc": 0.6223241590214067, + "acc_stderr": 0.008479309208281646 + }, + "arc_easy": { + "acc": 0.6384680134680135, + "acc_stderr": 0.009858506543162063, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493126 + }, + "arc_challenge": { + "acc": 0.2986348122866894, + "acc_stderr": 0.013374078615068754, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946526 + }, + "sciq": { + "acc": 0.912, + "acc_stderr": 0.00896305396259208, + "acc_norm": 0.916, + "acc_norm_stderr": 0.008776162089491122 + }, + "piqa": { + "acc": 0.7431991294885746, + "acc_stderr": 0.01019286480227804, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.010009611953858914 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4faf4b238987085842a1b2c14b77a651232aa9d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c09344aa02d6728caa7c827db047e1a204a1b7ac9fe4b00e070aaf8df081dd31 +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10fb462f1bafff7000c5ae9970c5dbd2e79e74f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd95067b8c7e0e52b363a790bc96ff794765fc78c871762fca150069bff1cd8f +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a0363ce8992c38814fdb22560ddd239a119b14 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdb2abcf7c4a981e48d7f1ddf67b9c0fc468b15da8ca27f48b12ec1abe813503 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8309094679a188db2d57e22cb9d0709a40033090 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61e510f53e495a9e98e8beefef5ec21cdca15a82dd3efdf1a40a163857421c2 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18dc4731e971e03b82dc4d70c9eedfc7c89d876f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d97aef6e9f2c9c553c8fbd81c69de83f8bc4f03f8e330479dfdccae259cf25a7 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df9af98ceb1b3ce1c43399e797f4601c82c04c65 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dec4de2115471b8461f55486a0e6a0a2fb346153f66b46122d4e58d594cf07e +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..031a75054a94fcb0430befe2fb4620202f909761 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a7c2a766e3befb879a764214f8ec2863e2bfc4704a7880995431e041e619eb +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce77c8dd679b957dfd583404169f57af5ffcfe75 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba864c6acea660f325c29d006f982630b86d9c8c482777a8dce40aafb69745e0 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ad4c72a3d3a3fc42077e77f0d6bf869a0aa74aa --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8232594aa0d48ace341e09cdb9da2f807b6ea5b14f0a42b32238920c770d0f69 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c7900b90aecd7129f08f7bf18379b19526f161e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e577580ce8fe146af971e0022951f118ea01fad402cd923d428168ec7a4f52ed +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a3aafd29774179569688dc38d38326f5b467323 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a82adf40a60109a9c06182b74e71609119a3096b6c86d5b4ec7d713cbaf14b60 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7176f3dd89c68d7c2534d2aa611c561e519fb43a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9001a7bdaaf6dd1a912019fcac2a04ec56f128faa2829045db91a0acb9220fb7 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45869b404c974a2a05b08627cdeafa1785a4834 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab74eb7cb8754eca00871ceb85e0269638d6e9f463fdbb1ccc5220994797aea2 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fa8ba4a2c9c5c1854530f9a5556d3b0b4956399 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:379c93aa28ae6e5f7c4ee9623b9f793021ad9c42219cd5a969222eeb7103ce5a +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b09d8871ee5834a94511a2c9884902f45882a6c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01431f4c8685a9b6fa070684307af5fda1448a3e46a4d866df5f7ba26d248631 +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1cd0c1e684851ba9561b1c0724564abbce490ae --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1aec01fc2ddd4beeeeb55040c5b8364a8864a4a0eacef6fda45cdb6fe1cc9d2 +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a479bb19ca82e49984209342e18c4ce430e42a36 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077db7c991b5a74e10405557e4f846d786614bc4cf2fa73332e408cb28398492 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2cf71160c8ea763a80d64f2f582dd6b3d80eb01 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c606d12dba2f735e93fcf970013ed4489090b763c5bc0ba70b90f95b377982 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9482e8ad4534474f58d48e2eb3d94d5924c591b2 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b276535c36f4ae8623c34c2210f36301b05bf5a1117bdddfdfd51ead65543a2 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1850690e15d36b37ac08a0359abd132617df8b6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d9329b5a90248f11fa1f925e11cecedf3faba6fb46bcfdbe1e2fd17d507040 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbab86cf5c07974f3c49d6721158bce747f57bf0 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4400640a7ee07d9ff75b15c89f285a0c1d5e9ad388d2cc05e972743d45384e0b +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6cf4d2e7f83b207d811a6ec8aa90f5ee9142926 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b50931ab31b33fd720106ee38f8445e00e101826c25fb3d10e0f3cee6276722 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9571da50e2093ec0015fb550c4feb057eb2eed9f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02feaf167fdc563bf39c1cd957c720b72e1f8cad5b4248d6fadea7bcd2ce1c5b +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b840e95f9b3b7abb6eadcab1e2cd5bae834dc4a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395aed363428239e6c5ca1994e119533c635f6c6baa62a018ffda186599fca61 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f554b56f7b529efc8f4ac2c3e4bfb7174e8385f4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b4cfc3d704d7abade0f0cfa6b5396d86b03416f48329e23374933de322d80f8 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cd0f0c006458d3959d8d94f805ecb795c263d46 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a4104acaedc08b98421c01ce250f8d1075e23aa243dd86f350f41e9a86ad487 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dabe2a110339a308c5ed57df461ba3ed8796c2d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d92a66a5dbe13c8b863c68c6691f9f5c65e8019cac919717cc4378e2ae3074 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..792b821dfbfacfcbc4aee7fbb6ceb005508f6909 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdb7ca143a0a68c90530a54bea83644add76ff2262c06ac76f7356a0e23f9335 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ec51706cfa242ec3b9758430082abdf480c16ee --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b2ea48f29fc3c25da4aec38a55bef82cf9758ab789e422ddd4dc305c3350685 +size 199058605 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c233d701c55f38d6163b1d49da5cd4fe7aee102 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc00985212e110dbd093518313dee1eddccae8458ed98f8cc510e2529b27b04b +size 199058605 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eafe840d94049aa773fa331f9a2a7b7ac03086b8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7a2a87e4c4ff27221c5eed31a5197f86a678170a28f656a35cac25a5374cce +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fec9311336767eeac90705492699345d2ea9143f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a2f60c21b4a7619aee1bc634d5f405272d2597a0c7bd1a36d8e0a57812acc5e +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4fbfd7b4457f5b1b003f0e72f7f6509f02e1fae --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014f903429c5ddeb69ce93539d8c655df580ea4c0c84f1624cbfcf590a4fa815 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83a0adb391ed1b795c5ef2f6e6b8abdc26b4108c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cacb0a1022dc38879f9976881c8aad83167c0880497e511f18a14b408e6a2554 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f634957accb1dbbf325627500e41163097e30b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c713fe867d4d6339267e386198a7599330326234bef04c85fc8b6737ff4368 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d152e3eec5124cd54374aa066d3d91609b517075 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03673b56e9c3e52933006291e6e0aa2cf6c3432a5dd1aa2467c8ac10eac014f +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c694d2b974605dc3e59d70925289a4f21650f6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcecb925243396b30d40cfd21bce97ba8feff81bbe9d69e56673475519c6cc7d +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fc9dcf67fa63fddaaa1f940679b53c7cf916deb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f67d7a40970c3678e117dd347cb80e43fc672a28a81a434cbc5fc9f72825ac83 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d11e094a8da73308c0b8911bbec49cfe8df5577 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d7e2b94cec18c35ed2b45c95b6da3355c7961f92a1bec82e378921d95227e76 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f115b995ff5bb98ffa16a055df872019b2a78b02 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aab25d51ac78b4aa9ce16e319ae573b0b6947e45f34a981b57e6a49a8ac1167 +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b58c3fa66cf6a97034ceb33b30bc52290585c767 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823085e8b470bf8c1cf7ff35bc31029e3fc5a3b0141efe916d45dabc410e4b96 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a988f859a16c842f0799dea6daaca286af6b38 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116129a158bef8432ea5db20996a069ed52d7b4b8cd513f29d8ade8e5c1335b6 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11f1450400add64c53a202b24acd688e8fb9e2a0 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0085b615ec849f5ebf13e8d2c6457a4f31421e8d8495ace1f0d49495be9fbdff +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1895d2a9613f0e404cf8f9de5db1c15b19f8403e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632e0b07f8ac817a42338516752527275cf2e9dd1ca5f14c481cee101bf711d1 +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce412794a545c933da7e517010bce5805d38ef66 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b09a82a5c49d395a374e841ec96b81adbbee8e2dd4f039bdd6814f9da5a6d30 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df669856fdf7922e0fd02f3a78998e9a8f375a9f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8840a676a03b68a4fe9f2aa063a0fc82f07cba0234d0577bf58e0055169db8c2 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ded446b536ecc72f07435a833ceb7b29f207ad8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c19c7f02fe34698e1baf3137865aae51f352c5d5f14c0ca86f5e613849c6de9 +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa684a470e975c913d80c0f14ab00cb042800ccd --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd05909e46a752961cfffeff8df29dbea70407d5731bb226945b8f30bedb8e0f +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fc17217d4012f3ecc3a61358ab8f32a92cd5fc1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70435516a51a9d39057142879af2472f79d909e826e66e932106a8adcf0ab07 +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df514b7e24eb39a9fa7759989103b64a08d1dc53 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3694289dc85d5e2e069064399efd5aaadbab86e9a0e01a762d1f10ec062fe7e +size 199058797 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e064b54eac28e0abe317d33d3926fca1b4e5f44 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30d689adfe50a435c93152fe7951f7a6d7ad6d905fd444041350eeb7284464a +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2497ee02b2df6664570603cb5cf422f9bba5786 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64af3c035b004f10997b76836cae4387dfeabc2bcb992c589c992a0725e1e85b +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bcf69b8cd7a424495f79746e6f7c0f7bc6e6632 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d677d2db14a53b94a78c334d01e646197d7d2b5db736fba91f30604b131f91cd +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a00f532dc6595605ec707c62b55ab1b76af3d44a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:193d6872d3041a460aecd271f3381566bc34942c01b9b59fe59032f34f7fcfed +size 199058733 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1eab72f253a734df556bfbfe787c5e98a83f5f3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d4b945345ef75623f91e89354eaf40d21a7f8995e492550cd3c9dc7166d8db +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d64eedb920a4e9bfc79d1fcb5e2110852ee211 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f2f8ef8598ee2c5fef24d0731685595ab5c99bf04ca995b2f35b939bba35c8 +size 199058669 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c55f33c2569f36fe3c5d8ce8f6307a132c5d751 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b969b369ad54583b7f29be70e1270492990dcd58b2f35e1bc6a5c3922249d59 +size 199058925 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b607f17a55e4f61fee97bbee30a2992dda2d8a98 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff1c41f7f34b4f7b84a88946eacf388dbf9246be64559a63d02aaf7f5e3d8263 +size 199058925 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..231d036cf98c65101043274fffd2ae3f5f7e824a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0381615a6d83f74451f74ef38ee27f76332a2231eccff8c3956969808510dc07 +size 199058605 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac64c82279e084745b6507342fa0d12511bbf88 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd63873b0cf001297888f5e62b7ce83b781f72dd2292796774014b265443c86 +size 199058605 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..803a9059e9b963eac6bb8a74d31dfcc89f44e004 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ddde9b2691b9804e389a4ee114792a95a5326ff7d03071eff810535c96e132 +size 199058605 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd0f84a1cc285589e15f80e05fe9d813db7a0791 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8333bcb66f7c0512ae200fc26c6304fdaa592acfac6a78de2fc0a20fa621dcf2 +size 199058605 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f14682bcc47fd6ecd2022b233dac2329e7fc5398 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89006c31e937d5abd15e58d9b17f1048dd181ecb4a173f903197d660f415b269 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b164ce5c7c28b052b2df43eda859e9e091df19e6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d204526b64a70e503276032d0fff29af6f7b0864b8e92117ee08f76bd421b2e6 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50285ca7006c546c96f26f62dfb91174cb9fe15 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d49a444e5c5736f4005ccbf0c074b4a41c8a1c497b75d857fd7b19025927b60e +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4292a6ba1f358807d1aea856066469530e509217 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f58074422a697fefa59de5a7ab9c372d4f8558e755fa4b7fa264b1391e7a8e +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..869550482421027a81d1a8e12716e734a3dc8981 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca1ce8e6c08cdd46e6a606aff4e80b9afaa468c7822da80bca851c837eb81a0a +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f5b5374f3b0266ad3975762d92f813de0c427ea --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34810d7ca5edd8ca577f742c29032b48bac7ccef784888ad92f671e348a82b05 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e19a102a60796e0c011980552b7c2d4d0b96c2c1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92cf49a73f1cf17f0346057641c3520a04218e9f782541261a10f07061dc3046 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce498461428d423b6715f2a115d4acd5b930dd2 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36d55e87337c0ee1df11f2101c012512cbc77b673569df8b7726cc068822a1b +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba9c927f4dd8de1b7c9e1d30d8839035c1681a5 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6867a2d6705349fc234e99d46f832ce73d72b06315377d1c10666b91e4e09a7f +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ff04577a9cd1344f9e1e520ebc1ef4c5081d27e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9177b7807bf2ab4515a3e5bc78f9e13071a3ce3aaff2c09aff61af6102f5c02f +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c520d09cc586ac82f91aaf54dda79ccf00e81b9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48cbd7a7d27c7f4979ce892db211106de0f48ad3f2f549d8b4f4fdea1d9f288a +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7798e861d76d4bb06955671ab18012f5a10d245f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a745671e5490e69fb83d4efd4f8a941f024de1f3b835cbce7c33e4b56511ad7c +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..436356ddad16bf84be00e27aed0b8d82474bb850 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a092d4c5eea1003ac94a61ce6666241c9980a3df0991948d275d4cbcb20177 +size 199058978 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1417e71abb2499473115a319d8436943f7dd66 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f8ea318b2b629f5ad916728f83f70754001b5e7e4ffdbec0bed30513edd8bf +size 199058978 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de76eecb2b4c29be2034b38682b93e6ddea35ecd --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:752080d494a7b2be9e9796f047221b887d32700a021d033a1044953c36346a90 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..038f08071a28df365c3bf0a83decf8177e27860f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea309427a1a59ad9090a8307b033b6b15fa9e206b64a4046671a4c3d764d31b +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bcef2cc57b34d424939d529c0abcdc13e3d83bf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:466fb1621217ec124c4c91d3a81f6af6d49fb2efa4aba58f7883e4dd4b0bbed7 +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b350b255276e50ddf20d420f28cf3dd9ed9fd84 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d837ff6cb95361bc0efa57bc6e60836c7dd850b9e9ae27a1c366a6f5e41c2da6 +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..732b6abc2f03a0324a172a860a3b7e0893b232cf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5874ed96619b7e56e0653ef27556ebeb31ee0c8e6583223230f60b05b4d3f9 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe49eb78e1e7ae9d1be3fc346a08353dbd06be4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f13984492661e248bc367152d491b97d8e0acd405a71a4b554fa708517251146 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4135e20facd80eefc544faabe23bd53e076c698d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71829115d3ceeed7ad845318fcb2459c795a7c0d09b14c2cd0a1ce1e4f6a873 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaefae752252dd8f8559c7c7267df8bf417869d0 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073b1ed4e74dba50286bdde2ee5c20a607406342d1c77df0260b448ce095f1bb +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db5d3b0f453973e3f92a823d1816b78486241aca --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8548a065ed25fbf6e6d53de3649f807001b719f0465d84670fa08655aa8bdc +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ca626954eb14731cf0606d1dbf6466620317a52 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b749be3ab66e2dc4c1b6830cf2d4aa7f548c9382e7af2750ecdbff637846672e +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bf6fd99aac9977ed57caf9f922ddf689cafdf3c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236e1a103302f92d942ec45401cace9c70d7a9d6497089cbffc8cf83bd55bfae +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67167fc97bb5b7f89521c4ae270bfe8628fdd72c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b36dcaae4149d0564ba45670845eac60434ed4afcf1b442b89477b7eef8fa7 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..657fb3ca637e068c3c288acd246a3802c44a44bf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7731d6ee072b12da194101289e9d4d1e79c9a6da29fb0baf43ce24da44f78e8 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3552f5ef91d712b2a5dd9e9958e63d36e165a0a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8da75a1071c309b00b80514161cebd87900346cdf31ddb520e9437e2e0f2339 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5153cf5b641276e43dca21695dd6c72f7d6b1f17 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3072f0738ca6c208d00296430a4e6e92e74d2d44e321470273e180c35b8b5e32 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d63b4e512541caaae635980ab555ac07c2d8d081 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:158842e5a73cfe0bfe4ed2887f365de475a8feefb67c2624063df2a8116f0bf6 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a645d73d7f10481f06ecc118a433a7a3777bf710 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1dc414135bbaea182026fd84391729ce044f1cab400f707059f1758e8fc92f +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1821047bb0624fc9270eb8132912d043dcf74dc5 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebec1c764de879aab8f0f9c8354c90b6822d5f7e28f70a6c1185f53e5ebb4ed +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7fc3c188c4a343473e03e1c6a75a3fd9c672fc8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa0f18efcdca94f82308ce16148942fbc6f0fe50d049eacb79fcbce5d031141e +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19477c5033d7baa633a0db857876db5e62e464e4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aebb4c56f3a598a322de764027735c80c2a21a6761badabc49cd145e86078a09 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7281afc655ea3f528d6107e9b0f86a3818c8751c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24acc87ebbacad53b6816e8d82fc41e26c1ed99dec0a2df3af139f7e9a11f9ae +size 199058594 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b0343b19fd2f28c34ee356e013c2d0cdfc37565 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da095241c653bafe15a9430794a5937c491aad9fa47ac1e8d206b3eae874c99 +size 199058594 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61dce231f12518c16e64e0da7f305083805a384d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3423ffc92c96d08428880c7be6f081d8478055ed24bf2d517f2a57b7060be573 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af531348728a93dc0d6207500373aad98bdbb25 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f17efaaf3386211008d15fc02f9807be38b5af5d8936b08dc9b7001d1ddbd8 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb5af304251bc3cc1f87002386210bfbfa215e1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583372e72c789084d4cec885cd87a535e3459829e9c9dfb45cae0f03970e5ba4 +size 199058711 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75da37c75b5666659f47edbda8ea66079a7be6fa --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81a65b5a283445b12e31ebd8d29fc0c82eac556698aedcdb448c2c550e9dd3fa +size 199058711 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a14dd8bc7c4aa68c7c439de672e7aa36cddf9dd4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da2c3637fe6738eac032952a62b4070fb198942468085c2eac421a89ede6ff3 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88efadd9cda2c142e7a9108ff925e56892e1a847 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3a2f00d9b2587ac31816e4d85a3358c04bb58049c7435c3b7f617ea8339f8c +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df3ab7627829eb39851f929b46b980f6ab76d473 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3454ca19346abd831391ae815ae487ce3dc3967164a7993710c015b647a46f75 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6767720860b3fb453e46b083f710d798723f3cf0 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2aecb49fdd4d8bc28f99113fb44d1897d2d1c55e622062fabe773760c9ae8b9 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6314acd83f1d38e5051202e58730494f868c11a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4ebc9a3d360da48a921a1de07550f00f9885ffdc4b1bee0a034a7b28e67d18 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee6036c69c9a8e9d38ffd1f89e2da3a8f59f182 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4df73b619e269ea93eab1f3173a7c63adf8e6b2d7dd83df69b48d55993d9878 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00fa1f3c3f05539f883ebcdb3cc3449e7ffd9850 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c7d0726ff89a0d6e4d62d87a0d2d07d223e281dce91195ad9401eff79e4bd42 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db099bd2e9a58c1866ffe9a9f79f13c53387177c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72234839018af6f20daefa9fc04cb22b612dbed16124926d3fbc93cc9052038 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5c9732b44319fd3533a8c18fa1387035ebdc2fc --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5085cff017733b6c66c0f1e1f8bae760770e1eb19e0e07dda2e2ec225116a99 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6c9ff245a68882fc6a7618cb514ad0b21216013 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a020a8e6c6d214d4c1dc0c335dfb2de4d3d4c83cea21ad569e1a7a22140f527e +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5429ad1c5b8bb3fa531677673cc311053940bbad --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ccc89b5cf03ecb15b1ccbaee9b8736ade388e715ff26d688a997794c38ca6e +size 199058594 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1221ad4ec12f0500b905c366fb322b68549108e9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d91b1cdf9ebf7c27c07e25d9dd621c412f15aed6c6bb10d0589d11271e8b5b3 +size 199058594 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6108a1fdb6bef9595b2494f31c78d90ec1a3ff05 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a172ddf630680dbfcbd3d018e00ba14901769e14cc3ccdfa5eb0520f9c8da992 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f2e39fc9e7e6c04fa523559fac1a1dcb6a7eec7 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0df583abfca44c1290a3819ff6bfbe7530973e0bd7cc32fd13283aee3ca0a50 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7918da33722f90d2e87c13dd4fa5f6dab97a2097 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2401d59fe990d8e63b407824655af2d34f7769c5f9d9a4dfad25b9658f534b +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bad1a7332dba7084334637cdee3aeb7fd3c2a67 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd1125a3eb67e26d293f0f421177ef4ccdebe551682b176d20f4fe4cd06eb40 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4a4f02cfb468c7b03207cf9bb07477a0092db2c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff30f5fa25d0b1002f2040b3b1cb9df099e3fb8aa0a0dd39fc106bd221ed7525 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4be681e3f9a3ca883579d8c383ba34ce80851d38 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3d4811cbdf5138216a56789625504dbcf36f95c911ea1d730aa743c26d66ec +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e18eed6483fa8c558b1686b85c58897f164ffaa --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f489bf4bf8bda4e77051b8432fba153b1bcab0b91e2a49aa38fc41a7812db0 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1876bf4e29269ea987cf3fe80171af3ff66574c6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c6107a8580c9aed4a20b8efa3b599e0bf101d69e75333911afde252509d507 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fabe41b5a6b9f5012712efbf30426fc6d2dd5a6f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b579234af4f620dbf671d91fd38e9ef4a537714a0d468a9cf0c0d25ad179e3c +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be4e0b5df2fc7f96f5970b7cbad2223a7bb862f8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a549358bb730ae7f9b2adbd970a7e076ae929d3ed0c23e9acc3f818d906509a +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..721a9c7232a69171451be7a17a106b5beabc0ca6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d8385808697a8fad1b8ec5623e5ebc2e8758454bc2dd71fe3309260c5a84bb7 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8c856a39c80aa5ca3111936e260370fc84be33e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81e10804b8a0d44c3efb0ace36f9a5cf9b4ae8b43c9073ce6a929c3857c4fba +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c05c82f1403df1c9d2dc2697ae9134b2ea31353 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4593566fe2cc5bc9c1ee07247f48e02539c7381568607490264e0993eab110d8 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da9198417901c8d8798e3af0efde8974640e608d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7fb97a4c95d13037271413c4223cf59a83dcc70d3cef3ba1b806882e4490ca4 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8c1f7c9e3593d786cf0b3ee610cd1d0f9135313 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f22baa94be778b8760026c72ded09a8ce883d7ff501cf83172fdf10830ae443 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a14483fc6710009795cecfd906403e97c59ceb2c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb6a08d12945e393f2e5eb379145612142b7e1e55e5caf0e2d120ab46524cd5 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30fc20054219cde445da8d8cea49b57a604e2682 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc91ec6dfeef3742d78659186a775e6ab83e4412e991bde0bef94eda169dd03 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..528dfcc3cd04c600172c2c04f7f82662484f610a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778009848fac65b622e1235fa18930d6700fd80577d8ca6969af0b4f9a7d52b4 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd14a1177cf4fad5a5f962e5f1d57f69d6f99d68 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c4d946fa7f3634fd21b194bd583bd3720bd745298ccca119fd55e2e0c0a78b7 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ade609044ce9b5ed71d1fd1f90d48ac3e2c52b3c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92242ad9d71106eecc41c4bbb399e72e25e2d1ab3b5771e0704f002370c895f7 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4358f24305d222112a4f939b4e5f780f40945f4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58bc2e9916c062c9d85c18876ebc59f094b51f193a8b474968f44aa692f33308 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd54e1d357bd1b7f8ba3e84e15c885c106c80caf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5421f1c4dd12002c75f7397cfeea317e2f507a464377966d4e0adc8fe13db8f3 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4960ae7e93ee1b6e3edc979d42a3a8047c2fa612 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ed1f31d64ea245f8a0c0c95b993b98c70b9280e8cc5d1244a8a5084058d2b1 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b0aa531b4fff96fca33b277ebe0cdc7b27d7ea4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d29b50a9f56ac57e049608a51d16718e6187c6e8601f52c9bd99d6dde4d124ea +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c21ffe1120758caa6582590464788ac929d794de --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d52e61e7c335419d30aca7e8a41d48b0173e1300f5edb8ce8caa745e6204c2 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d6099e9c2a3b3660e78c952a6d76b5dcc1dbd3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:680743a981ae31c8ce223b2fcbdeff271c41e7a3970e5ddef1556c840cdddba3 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b9982d67ca982b1534ae865172df932ea03d9f9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e70583320131aad5ebd5756fbcf4deee59df0560e3ee8e92f7b5a3cfa6252d +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42443edd8f16a54507dcb216f7e61e731d0ad620 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e55dc1469de34e232892d43bda3034e1e8503c3c95b7b1c8eb8e2a69ac71051 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5791dc666e4a50966599f85495520008cc2f08c7 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90303cf2f4fabd22a1b8a9d860170bd2d26cad02e14a0750ee2a79d0cc349dde +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c554f56d06aaa667ad7061e2f58c137dfd8fdbb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c624fb0be94c7fd83288ed82c4edf2cb6ebe88d1eef3389ad5df3378eceba038 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..490197b3413ac14d8b733b01acd2e84bd820115c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842c965faed444618ecdfa309b2e172905e778d46abe385aee4c2a322fb6cb8f +size 199058775 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7744c3e9f2e4d574b2d083ec9f68908f16e9229 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc3bbad023ad6ce5d45c68312563d43fee59174779ec35ec0cdd435185bf17a +size 199058775 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a0cfcbb599739ae8bfdae760b372c9d103212d9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c35d535634599ecce91aa50f791f5a25048e95c164a5a5bfed37e8624c7f38c +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f1add5160b033fb7e921eaf74d67b0fc02bb70c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a208c81a10553b833526f5fa8d23415437e55087617a8e29ac38e2a7fb0e98b +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51baf0bf381657e7840fdcedee8cc08a4d1d5697 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f03c4a0498012f599b8b4d12ebcafefe7018acf25411b5451472f4fcaa5e98 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7422b52547fbf46c8b066c7e17db645c8564db59 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5991266238ea50ef7055aa54419ecd0a7f08dafbb5fa71ff5c6d17989b7604ed +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaeecdacbf1f2a3239f627fe6ca8e0217978b3f1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58be04a6b4a9b5c109cf64837e5a2866a3d0c4db7c374b9940d28059f6cb91d +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7581ae861725bb0ae534c2f98dfb56063681faf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f72ad8f39a623e888e5f722300cb378481b8fc3278b57a94dac82f04dc5a3818 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e972d0b56e1548e51276e534882933eaee5d176 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ee2100cae2cd43a5ba7a8a1d172accc4295424edd8e0010071453958c02469 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d95fa93f40ad31406a7475ad89daebb3ab99c40a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a35cef44db8f2b2bdd839c995d25b3c5f23ec07ce70248ead474aecaab98a39 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad83ea29791ce4e993b8b6372a2a65b2bd180562 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced0ad40446df900b414d4ea841bd49921d4164b22c3efe6d56ab49a9f453963 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a83cd1fa522a5e3bc2a1e39d116a5eb14acfa2 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a19e4ef04b74f89a34d7c601a106a50370649e934b4eeb7269243d2f61e109 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3edfb875d22dda9342157a15088d443c3a42bca3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c401d81ddd2e064aea62a82dbee47ce6cc8887e8951dd3ad52d8f71724e0f08 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27d9683af3b150608ea1bf41a31b6f68cd9999d4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c6cbca0104e4f188ca35fe29de17bf3e9f0f1bf4883ef0466ddd17c4f4b0cb2 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d3cb880068e422d7de77c9dc59cbf8f9edbabce --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568abb678397f26fb28f81a6e1b2a769f95c8db73c8eccec983ede80e2760bdb +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..095168b369586d9672e21d72c7e6f349f45bd2ed --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49eb672e915629d6cd98a3b08c7d68e4437162b8ed94a1100cda328111da9b4b +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cdfc5f4319edcba44950be4fac6e02a7e2c425d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b117a395c0129b748b18b7aa677fa7b6f2da365ce884a77bb8f168a878c7d0 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02168eeed4e63887147405b81bf11b6c14f00c4d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73dd505a47cb2a9313337d7ad36f65c715252d7464c2246bdff920415e9314f8 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..188d049be4a43e8f60a78de943c5fe8bd1500d41 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994ac768cc926b333bd4a1ffaa11ef3b9a023d5cb67277a37d18c0659526d24c +size 199058914 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b729b5a10912edde487b5ee94853256c142137d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d6d49b9530b39b51b5fcd93ed614c9012bc3f4cb44d6f29561726cba1bd1c6 +size 199058914 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eaa71a07411385ee91099ac52ff0c6e3a7d305f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:181fe56a313b31c8248b6f6120fd177fccf92d2480919cb0dde69ca362690ab2 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10e12d725110d8fb7a89f33b66050234790a6997 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b976992f069d9e6b35855ae03fe03317f210737e1caf54a7ba1097de53be387 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..294a9a43d50170440eaa7473d0d1724258e3256e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9443018c70037e86ee25ccccbdbd177e35e3535c72d1a900b71af2700b0d50d9 +size 199058711 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..249c755ccb64cf25bc714d051d30b24417327bb6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e23dc023b076589166b89c768de355c8d8d6bdd8b8ddaae004277c65ec00bb +size 199058711 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e8b0e5cb17636f74717a64925ec518520efcaa --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:055bcdc92b29adb21c80a783dfdc07e1064629e7a4e0f1c0a23cf413a4401cfc +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5649ed64a372f32d427cc3a7f94caa1afb023c4e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eabdab5ab014496f724be58be5eb9649469df0f6779b479f13e0c3cf31538f92 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ff4f66a957fc47b59886807b3291182f427cad8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28063096c0cadea1bd9afc52a7911ebcd4b5d757f4539c1da4d03109db7a3f68 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edb86d2053a2315a2bc4afd2e59fe8673c7c00d0 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:462d727e0879a242db00e06c2435eefee5a4961b1915aa4406b499b192c86131 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9a173a6d36a3375227047762e5acc1bdc4818c9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abfc64bddfd13f46728ea7b3919be679ddaad13b2922d844840aa6fe50242b49 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e23210e2a50637645b5d0677ddafbbc743635f3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f03a7e5131e6f47b6aea60b917eb5b086f2b3c7025bc445da3421de6d32f0cb2 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75a46da6b5d548e0bcde91d66335658823bfb5f4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d28a8be82389242ba8a2d27757f7c8333181fb7e8172ff0231ba5ae9d271af9 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16759b7f33c7222c7e59370179f55c9d681270af --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b64ca14acc6bd344e30e7bde433155fef7ba080898c8733c2cba185877fc2d0 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8546a14f2e89e8d32999dc4348be955584cbf95 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd3339683863882bc26ed234b24b0c715b64d0a95fe4c2574610b30f2e6968c +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f59dddc930d828939846b8c3ffddf0069f8f141 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:504199535c66174d2d69de9b646218566357f054126e7bdf7fe67453fb0dd485 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..135dc3c98caaa77c9166ffb6f8eed74c30150016 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e2479cd72cc4810d3be5f4737f56d77790a2a1191460ded55dc82737c99bd6f +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2694944f0f1f3f24b2b9262ff7da77d912eeb61a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99637129804920c0e2f8b05662280124e8158f39af0f6cb5de1d05435012a047 +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6858a0e5280dc8f417628ac54751f1146bc76cf1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e73a54c1df16e56efee2ca555b4bc9e8421ccd51c21ddbc7d41390813ff727 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f63e42b41d715b031c801bc6619f23689c2b62a8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b80318f18fb40bc57f2a8edf109ecf10f3cae93816d2081609a79f2e13c2315 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c20a3aa12001745ad130e321f65af0844dfa1bdb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cade20e4b8bf29c8335444a8d01d526341bc90752bca31725f1c3c3d8b1ac76e +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b513e39cc0d27e3a8d9ff6b13fb8a6a8784ff51b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55c08a042185ab6af04564e53d535d865f86e0ca6129c2aec39220b019dc945b +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46aaa1f5d973549e31362751ad18ce1e393be69a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c69c8a335a881b95eb920c1a91e20a76d25f1be4d77cc9df0e1e10ef0a5cd79b +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88860f48df64a2d67d38e32308d385c542823821 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3e3351cd1ed0ff0a7f16a104cfde63157974f1841bc140e7f670f099f0b12f8 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2189ef6617a0c1b1afcac427165939dde29314af --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ab03538e0513392c7512919d10a0a2f44973e68f21f2f11b0f586036a461fc +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b45b4c26343c18d2f6774a236f9465b90cb30d3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3687df7dfc94869ef32a99b3f17944b6175ded5e4698cc810807ff851c2c1887 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e58b4d46114ece8911a37ab63a3c8b206b6a3d9c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c121c85c97cd94264892122941993e2f9860109fadc9f9d62dbfa6132d490d21 +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab14e2893f218f5a7ad3f3dc34b594a346e962cb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7066bb23421444900f19e678b06dcc26f330c307c141c34c24e9673be2347506 +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e278c0932fd19c4aa0e8e5768479522eba7a67bc --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39300ce8676f5cd30c533ee3dabfcf57b91581b788a39edba10f4318a07adaf2 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21461f143233542877af294b1ad3789a5b83abf0 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb3b5c5c23a1fe7ca1bb663d4348590d584275aeab35bada1e29443f5f0bea6e +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28c7644d3e288b9ff54452ae7210402ace7da1a9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08213584f4315dd61fae87b0a52a0e8fcd019ee6ab577c6ce82c8bb05186ffb8 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e980619079d7197aa8fb95b11136009e73d09329 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1d184612bac34a129b159f6f14202f666db3b47028fade9681662d8064a5ec +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c5a56a760c0e069a4491e6292d75b8cc7afc84b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f8ac5d84488966609466e1e2d995cd279ba8107ac90130310b319e93029dec +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a595c23fcb7b57c15069400028f1f3b51c68a9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8735998c92ef54e6c80550b181b657130f6e7a0ebe4f02d0cd25275008f73197 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ab89b084d0c2a272a2f8446a60deba7c679c6db --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d96715020d9b64b4ee8c0fda24d9bd96fdd926b90428688c8a53ae36a9a84f50 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5136e00d17ebf2d112b9a324cf8386848c0554ef --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e327533999d54cc8d6ecbb7c712633b631dc954250f0b9831b3703d403b4a6a2 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb10ab59797e9daea163f65b2e3fb0c2feedb498 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b836ac67011f471b7406029b3e22d2d21a9360f6c7bb486c2bfa125e7e6aba8 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fff601e705bc50738341f520a358762fb206cb29 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3467a7c724a2300994b2fcad9f6e2e1d1cd77f204078030d7a60ada7a69f192a +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55280b77ce42e38cac4c801144370f169f41591 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41340586151bdd3aff72036ab71ec7fc8c3695a5fb871e39c572744a9a988af +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..450edf0298e107a7e035b7084cad06193164f503 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c994322775dcd19ef7d918490ada2834715c3e36a844e335d459245553f60f8f +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daa1031f8b411a7e3bd787411787d1a5d9891b34 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9430edc155b1f1f409e950e9592b5a11459368e94043d70a238dd56f3ae9617 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b405debbd5c828964d5520cc757a2df82af50ae --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06f9337de57c99ecade58516a248685d39b28c663b9514564d3b67633df23ffa +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7ff1ba449345a8366f3e6cd82677aaef4ec5a0a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47214fdd4c1698b9416870aca8478f188987b4abd158882ddb6b848aad0e9833 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d639254b0fb5d5f6b18c84ffee7f6ebeb9dd4dab --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9161a78a22c9b33e443721fdb7b41b263ba8a211b3fbb7b888fb856a10744717 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..707b1afc79f044a68733379a3d67e1a15dc3ca37 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db4c0a67767551d900e673ec80060c2f5784dd974618d2891bd4cda9d6aee5b0 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28adecc8f768b0be637b68fd9500062d32b4d13d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0045f06a0052820b2d5cc7756503d121350974ef1f237d7bf3d05348db019a0 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad0138bda201c679598274ce0cc75ecd1c2cd23 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65aba36fa7cf0c55cfdf3e97c8936e2ce4e30f9a1193f707a3369073e00e8558 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fd0500cea71183e70f7a451ff8648b0801b52c8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e54183f24f4f11a1f055fe6ae663b89c3a211f41e83f732411235ff1820101b3 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02784e2189c48b81f15c7c0c7e50cad50e8d742b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5869d94381a3bc6b06137253cbc29f907e56a6d33f479da93ab60e6ab5abd05f +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cf4f32c61d21038acb491988101dd0467364022 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd7e83a55591045772d525a8d272b35871527ecf1e92122b3d13b22604d9d4c9 +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ef786a17b8cd18948236ce5e05480f7497c6cd --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c01a4a60347465bfa6f3db289af8134fff5b836be61d8467a570bafcf3cd478 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e354e8ec9325883d1fbbfd5ff2e5107c955c34a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2817dd6d8cb5163db940d4733442965378d8ebe1c16194babfd07cee2a789447 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f0e7fa84cdf9d097ad8a2863bf8486cd772065c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45350a96f1ad47f6209dbeaaf9cd427458a1f3a3df263bfb56217bd4f7919783 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b0d036b4eb63fb6deae1ee64467955475c79a9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8662cd01aecc3937f6c667d6330b7a191cd0aa0622b501ebd0b77575df3140ad +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ac7bdb6565a9d3cd9c47a06c2f92d6199f6ebd --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419fcfa6b3dd680bccfcdbf94f5f10b3ff7423c8b22027331d0b3e873b4fb677 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae170da161bfd81079d62d66de4fec962a449999 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:509a96f632b83e97a8315a385f5a954e109c1cb992938d9d71de5373d6327276 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b5c3702456b4e942a2b5fe34a51b287e5abdd1c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7eb76359877083541c9e13acab7be02897df4c419af5acca6909d0d2cbcc0b +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9781ee8aa82e7457ef2fc5f79ef3a57d710bc8d8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8df83f699708b89acf258e9be34d9c6e0b60e228252629508aea15b80bce944 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aec8557b6382ea38adc7b1594773fe87430229f3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d8167097f7ab3398b3ca9114977213bcd6c3dc95b009efff3485d11c097e3d +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0814d08fbf349e93d68214679c4ab3c7d204ba16 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80f87d1db5a0d5e61015eff7fdd0319328cb9cb80bbaa91f32e6c2db62e0a5de +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..898931343bb88102458dd4239b53d3e4337e85fc --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc107095c4ae04b897a8a8c12edb19396bcc698a99e7d54ae1ab2d63a79c6a4 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfea68267bc26e26634674ceb9e30cb608c25d15 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:286cc31351b42d66e776f2da8533ff665e039b0ad43d91e42afa6a7074e0e1f8 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..430784811d04eef221e242276a53e1b827461178 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbeca7c762c0877fecb4795abea3be051f4a0063ebc07a892ad13229fdbe8b90 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e6a70f4e2c364da3013afde8258aea30d1d9694 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32d8b4a9348c74a503eb3fdfbfa61adc5f6004ead78a9c4bfd575937229cbdcf +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bddf08134d0f55764269c85444f0efce6095296 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0692fab2f73f242a0c2b5ffadac5b8f075338d10b1eab48607f00c935bbbdba +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa03d450820490f60aba6fad697045108da843a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b838dd1a244c94b22c6e0271a479d01ec41739946ec7ac061338cec932e07204 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d28485c53999a1f334e00b653f860a2d30adf63 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb4209246bb27732dbf4b56aad7833acb5787f9295a678bf3ad0a5a1ace0366 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0c501d77bb3c8e544741249528f5691fe20858e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3da914a3a046adf6ec6c9d5cb33a57ea9d280bad9a51aab8a65d2a234d1020e +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0800f122b62205e897671bcac9b63e68e621528d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e36c55d95d2a0cbb2bfc619c8bbf7c00d031a61523109434bf870034076db29 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eba02361d83cf4dcbd0fbb3c6406ecab249839b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:202c1ea6fc14246c341c8065e3930810c61fc86334f89e22d08f469ed8cd4738 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a51055b8835f632a1623fa3125dd578c4bb3c6b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69ac42910cf2b765c2a5c1ae1ba2e9fd995d5a50d422263dfb1bcc8063f6c99c +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b74ad1636771e8cdbc15499bae42339369c126f5 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f158247c78d5a14157ca156066684678a746396de5a0375ba442704661bc2b4a +size 199058647 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..332e422967e7fc3c07a4d5717584f078a91220ac --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf78b30ae6abcb1fc10562d0e95dd76f1feb48c21ebbe8ec04711bc7a0c626ab +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40aaba9e50347c17f40236b4b81123369ad77baf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1da6acaf128f203154dd2e281083147e14b9dd0ac0afb6afd585e9da6c55d5dd +size 199058850 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d85ccf3f025dcf9b902710867e68b1c682c3ba --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6aee5f86fd9b3514c5fa22feba487c94ab4005426d06bb338dae62060129de +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0e68b240a4144eb32921f803d3721a7ec27cb2 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c1178a059ec388122ce5cf7ab4371459c26d3cfdabfc9ce495c8598f9fd8794 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8af985243ee3830edff3b93535e6153ff038ddb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f726855cfeb42aa5081e2d5f79b3706004879ec83b5ccede7745488567945b69 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f1ccf2ab91429412b768c27f95875515626869 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:373cc15658a6808c4bf93fb6df5496094fcb0143066982101d4326fa718b435b +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27f3781389b3da7786f611ea238ef6c3eca4dbd2 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f9654d1648901ea5a2e132fcdab1da4e301ed3bd8e778ecfdec793faa517e6 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4286931abdcbd9baeee6a8c444cb7852c4d3144 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb80e58a8c2ed864ad2c2297b5475825774b6e994394013423ca13bf9e2119c +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25a2d8c9a022f3e2aaf82f643abfc61544dc399 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14130fb6a0b27e16373f6cf55e3334e4c274a7cd4d0d3b709dc67e0cc7a0ffcb +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f23f3be2fdf4023231f22e5a957cf12a1e190e4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45f60c6b0c5b574359c4abbdd1e7e9529b31fc700b5e63cd9dce48a8e47211f3 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2f6dd8bb5bcc7b305d11045073ed44b0c6b71c4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbb27869ec0b4c4e7bb3d54fb86f8f6e6c6be2ae8b66b15f4498fb5df854195d +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fb88142b3a6db4c1ca0a9a562940a63d4efa7c2 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6fba18d967bc0eb5d2a13eac4548211ea83f410f1d796d3bcc2505aca78c8a8 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..008c9aaf0ffc59af5e24b5862687fd7f202ac45e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485ddf48d812e687339b225705aaf37915a1a1a309d56456ed1d33a84e7b0a70 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..434247993b81774ac9297fa464362d001abbe9bf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11cd4b40a28324697f07cd4ee6a82c474fced4c3e1788d9132ce5e0a139e2b7 +size 199058722 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e8034396598aba348f68197819c14fe95287804 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8e639456ea0771841d626d38c671dab420de49ef66a49bd758cd895031d4b6 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0bf2f062aaa73995530e8f2ef4d98da6f4825f1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c42e748c6deacd58f18b96eaa664b345923a7faa99023623e4358676bc0162c2 +size 199058786 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34ae02603eab47c312e3067708ebe6d3b8c6630d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:641d765475c5deb99c8a4cd85aad39481211d8f7fa811c69f12f8f463b8e7af5 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14dbdda767e2c15cd38026499a371978c0c64c4d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efdd007acb49f623865ec9ddb66b6bcd32a34fc25bb7d6d3b7d09993d5a34b7b +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac15a67751a5dbd9eb550cceafcdb6fa7c1f54a4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d66e4dfa00584beea951fcb18feb96d3b781721907cca0388c487f32ea12b760 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12104dc55467f461193399567e8a2949f3c4530c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:360849fa4ca2d0d31686ec5da866327e575bd374d717bf3f3f26db9895b9a806 +size 199058658 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8196aecc7cde78812651d5c08751d230a2b13a22 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751e7eb7c799c6cbd7c21e834eafd99762c3f4e4639a8639ee2f568c8bb4141c +size 199058839 diff --git a/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99af8de4525cc9375fd876de4f3426e64939b0fa --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d3f6cd8f5ed882e6828c2c60c001a69a53bff5cac3f47d3837fa71bf9357ee +size 199058839 diff --git a/4b284b42bc4seed1/global_step80108/layer_01-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8310054c7bfa8aca4265d04f524375d0b61a5a6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8448c32523a94d84b3f023df9088735a930e6807ff7305849e1312336de9eb5a +size 167511299 diff --git a/4b284b42bc4seed1/global_step80108/layer_01-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16eb5ab9c579fa257deb374f0d6570bd2c6ad44 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a57e0209f92f1544c390456120b123ca98635e6bcab9ef29d599ade5a618a4 +size 167511299 diff --git a/4b284b42bc4seed1/global_step80108/layer_03-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d61501f36e1185b9b53e0f96cd15c8c8ae09cf4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46d7714c646b24c3475ea796ae137107a8c79e75cd5bd721bcd4430a8eab5bb +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_03-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db0a58445f73a460c9241d60315d55191afab145 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d07f492a99838e473d9a61a674bd2f589603c4209f816c484de1c1cc61c7e16a +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_04-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cad2bdfa31e4bc30f1eed601d45d709a3e4e557 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e111445015a7e20f54a100ee00d16f19c9c0e3bb29b249bfa683952209de07 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_04-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02adf98d7640f26326d48c584c07015ea4e4d34a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d77094026a064131dac24b15caa23e9b85bc83b233a387d0caeadc31608cdc7 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_05-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd32d805be619deb8da904116dc4ec36a8bbf57d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a2b7ec25cf13e7ddeb3529c699be2ac17967f5ba29ae3e4454a18c606de39d +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_05-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa6368ac0773e54694381eaf340b26a7628ffb44 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5039ab3727f2ccf85e985cb8479f101b60b14d30c58eaf96d3df0e6b68872c28 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_06-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d314920a0f8570f96d22c7a2156c3e376efadeb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4086cfd4d7c474bcb3c6ed8b3ff4ce3365d10b677affa1a07f021067db335850 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_06-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4987815fde2e78cfb3855e5a4cb4d02c2d7ec5f7 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59fc37c83c6238f1a076d79f86566196db70c2f8f76bdcb4d26369d64dd6f6d6 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_07-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c787b0be3f85fb623443e158b45b3cd228b1fdbb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c90395aa2f15a1cbbbdbead2856716688b409ef0178fbb8ca7c38805787bdd +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_07-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2c083b0ba73dfb3fd0b10d5372d61a5cc7b4a1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014db8ae06afa2469c818f27d03841465625accb2aa9ae8798d6b65b0769a268 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_08-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d62e4f619f2d2b88060cb88f4dbd3c07b7f4a969 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d06e64fc910bfa1d7642892eaf0e22ee6dc6838b960c8a4086167a288c8787de +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_08-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49ca38f6b0e205180f1abcd41756e2b954804f55 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8338cabd9288eea6a383a62c4918d44403bd2bf23c39e439af4bd8c032c8b28c +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_09-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a38d087acd15ccc55466654c0a35bfa52505ffd6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5445e90178caca4fb30ddd28e380f2066b63189651d3621c5fd1e9fc04ca660b +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_09-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8522629120e86a81a4eb2b3c224f0619c6e96a --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf467b57301e047a028622aed07b4f4d6f4ca6207d224e982b7808df0e5cf89 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_10-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc94071c67e544f79119a922b3cad3425d5187b9 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d075d6c9680d1a6242c00d47787bfe4f8473b85cfe6a7166d89e2351b11510 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_10-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36df136ea244499b3dd06bcf9680eee8f4ac285b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae056fc1300e6f17c52c2c025a2d7e73daf75b6574d2d4e743ef3024341f6a34 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_11-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec0aa8d0a874f04c14711826ef6a8af76ab037db --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16f186791b1cf9c4b41b14ae4c95e5ceaafc9fcad9a498bf582f3cfd7a30b04 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_11-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec28d4868a194ad2b660d0b8dc09cf3f79f6066b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7098fcac0023aa0bf81a7d4ddd5eb394c8822156cf48bb04261a6c0ea7631df7 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_12-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe7dda56c71a6592cac119590a38396e1a5f1ad7 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5faa6ea342dfb609509e3d20f8a9749afc18eab3fdad77115331a68cd72cd36 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_12-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ceb99b0625733eb10832a904eb238c44ecf9c19 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e99f88f5024aeb2f813d7c98417320644b5bad3c2bd4ee1b0a87a225ccc11bc3 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_13-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80232a9cb2d0ee5feac57694e2060b17ea621ac3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c065877964ae23565971c1288ab635af14429a7b2306de9aef7c4893417afc +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_13-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de94c0d83ea16965dc0f4c1a4e925809aa3f8f22 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52e54f905dbba446583daf12e8869caa0cca436fa5976f8d9dd0e1b4827ca1e +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_14-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc4c078493be73fd6dfc74b1e0bed6bb6e946351 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec8cc702200217bd5b934e05ffa3e34e37396492eb5ede13629191e500e961f +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_14-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a53188c8a210f7e6c970a958f9951faa3b4f0dac --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2f453d95113754a96eaaa1caab234a02d130780f7098b607b9a980d41f2a33 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_15-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce33b672f3dd26e74d4c8354cff423e5aa0a554c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553e9e78f8da2ef705cd158a35481c5b00fe06a69b9d6a27547f29d7b2a0227a +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_15-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b3d7b677c7462eaf01e8dcf51b672f322980a7c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d745df7ef9bf25f6372927caec23a91cc6a1593829769a2d5e30d923585aeb93 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_16-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c814a478812760e037e80adb6fe0f84c68fd469 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81115573caf0877c7f73a7eb6156aa4e0ad9b4933740aaf65c8a5c1db98da4a +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_16-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4c845677e183d1741fad7873e904c426a16919 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a14b693f103fa56c59ac407b042e02abd696fba7ff3567f01d966f5bbf4a63 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_17-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4297f47472c41c4ab0236025f56196ba167a91d6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f569e221c49e07701e5ed0c93fc9a4c255ce99cca3756a10725ec628250a0dbe +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_17-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82886369f90e7f673d66584820d9894700564f07 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb76e89d9b3744de7c4fad50c2fba11891442a1a5c34800ce14165b850871fb +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_18-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9ae37a0081b619c27f3982f04958fe5c2cab011 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a27423e2234ff79a26c2cb89ec3a46764d70e11f7d2a3d588d7bca6bc76b97d +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_18-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e79659fe2338a2520b630da1b17f124d998cef --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69294d9206bb09353e6149cb23063cca3c807202da5cee7a992cef474e40a1e +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_19-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e04e0a681752ea4e8a5ff43a3fbc1ccb2defb7b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e7f31200a31ddf3c72e315e99597f3b399384dc56454f55335a18007d627b5 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_19-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e570c28ad8364650d7e988ae758720f56068f683 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55902668f2b0aca8ec1cca6809b45e9c37a6f4e8d6217008a12cb5952516787c +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_20-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a95aabf6b3c3bbcc6ff3294570c01df7d4933d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49766cda67d06359adc93d85f81c2d273ef8cc07a261f16ae1fe62234d2d5b68 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_20-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cafb2e6f9afb0bc84803aaa559e3c80c9ac4b1b8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bed52e888017b91922a3a524304fa17ca31bf988326db12eec523a1130d18773 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_21-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbe1ceef31132e27c3cc87f896c8080942751821 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f19e8147c84cdb0ab296f47cc6f412855640e252dd5b70c0100d473852a332 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_21-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95c85b8eeff8979862ba4f1fc623ce93e0c43005 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:452584de2ec76e11f7327c15781512bc4703a9fa17e99aa0bb2dc1936c8e6b9f +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_22-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..278a3b7073e71e469d0175a656f38e3c7e4bc8ac --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543939dd72dfdc334dc6edd65e3d5026f72e5d06eab793d3c25bcb2c907b974d +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_22-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf4984d26952f667c2d4e01fe4c69fd9b778c52 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eedd8f29c2fe42ed6707cefcfcd00d4f934b4585b0d94372a5bf617ca2f5db25 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_23-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec024942d8efabde50cd9be468abfde7d364454 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c73363f5bb190aad9bddef33cb8911b6c88328b5fa0082936eed3326abbcd685 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_23-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56de2e19044da978e074d0540e94ca04ae943538 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:932fc0ede698b3def92aec3b8e4c24e9c6ed12d054ff290d790a2ac77d009d27 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_24-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ec21ef21333c94ff2f95e2d9ab38f1f39a8d464 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077e7415ca66d9736b2ce8f5603672129769b6db4c7d4ddc73cfb31dc9bb76c2 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_24-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f32c55c780125f1fb6f716f943e367fc95866f7 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dabf193ef6558f964851d5145b136898ee23762d7242e35abcf6569d24604fd +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_25-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8df6c73cb25eff63b35f055662fabafa68d8d48f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b69e17e52c30abad1e2bc0418a3e053ed348e971703c57e41bf92368ff21041 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_25-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aaedd7c47e7be55d43cfdd793cba3e2a373179e --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:017b78cb94a4384b3b603e846fc28ba7fcb6fe3f2e6d69d907db970384e5c8e1 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_26-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d3f3462b478ec117d5664f2d3c470e7932132aa --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726c172556dad1dea575b68285840a45578a87c3b8c9e45ac7e9fce65b746327 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_26-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4dddb8bef2e76a4ea8e683bc9d4e3dab8f0051 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:244bef16405958d6649a3fac304056f61bf21368bbd7d596d51e4ef23595b454 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_27-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cacb902a0015eb7aa43430c480cd5621d12acee --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fed41f79e3fa4b0d4e14a948bc37b8da6a979448b4d4ffb704443bc0abc30dc +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_27-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4b1ce63e9532b44e2c360a1769a748a92a9c9b3 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a516e293584b0a970ab12f245934bc7d3e64542048525a8d6584c3985572fb04 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_28-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a4741b69df8f51b849beda9d51a675e930fec45 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9bade7754812e1603a2284d36fd7ad6b3e26bbfd37cb293ebc1f54e69b3bec2 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_28-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57ecf8767329ac66cb412d7d6becd41361c998e7 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80303b3794184ea1c06f420f7ddd81e16f5b8653035be41064b3defd86cf84c0 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_29-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd5d048fa0e3115cedec72f5c98c8a1aab63e10d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c64efa4336c430538b365a941ee65b440885c4cbe8ee8813df0b11a9e5659ff +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_29-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd18afd9d0eab00c038bf6efd9b87c88d57ce9f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6e95a78ab7c3ef110fc7a8bc49aa686492e214281190393aece33b7f8b7b27 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_30-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bb2772baa8c3b77345964b7a5cabb9d8cdc4c7b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbca46c3e14c227cf796e30569c92cb70c21e822f198dcb4f8e70149daf9960d +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_30-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4fa62cbeebe76764b111ede970d3b7fbf8efe8b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b61680567443476df7104ce47e7dd298918ae6e499cffc66404758f05e4b46fe +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_31-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eec661396ed635e487813151a7e34a79edad285 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed0120facc1a14a5bc01ccd908b2f9ce1102fd2c189e82397d2f0e39332827fa +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_31-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e047195507bddad76726c21ad7c0779fd2dc9d4 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618cd498c5fc84a3b811a01619b4d1a8198b72db86c10c62f3fa921af72475c8 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_32-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..860bd4890ce25d04053701f96141f46c732a64bf --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d24e53d26f7e4eb0a8247278b1ea898dcd901a75668fff79b8e69541f46af76 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_32-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb49921ae884fc96a8fecc1b9495b1b84472100d --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387e9e56b87580a677300816822f0c6ec2543ed1adf702f74ba684d056eead55 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_33-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bf861061b9603536ec990fc5014e1a701b4d40b --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7864d38f97223224945ef276c4187a490a4bb496b7869b2ace91e6b392d34f +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_33-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..579a193deb1112e487e9444650eec7d2bc632fbd --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac2356d315c7cb4b2bad33bc8a8a2bfe313f993b5947a1511ed4a13a3e7314c6 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_34-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46791403e4a942a152d08a2ec0692f1c8712b670 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d774d8619879d323a4621141057334bb7d9168c7d09b1e60faf16c9a477a6c2f +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_34-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b29f552767bc90372846d12c7a4b4fa75d964b6 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a24ebfe74e017e9a1601bdf965c1a0a6ec13c9555e50834952468c2d83a4412f +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_35-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31c4a5846069e3497699ac8735d321df1b4cabcb --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3379ac84607511cf729f1ae44b01f7795cb660b1e411ff60389768a9ba2f402d +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_35-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..702becc0207ba3dfe98ff1bcfa2f06958c1eeb47 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3362937820b7e5b55076922db4727d51659de129f5ed9e60ef6e88aff21df3 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_36-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f01ea136a564ee8ac47f22b333c2a1c6fc828470 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d190ff7bcdba773d5ef3147f6f1ab19e6bf2de4014338e4d91f0cf0cf76a8fdc +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_36-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..467ddaa9bcf88928a4a62e5b60854af75c46a4c8 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b941f751fcf168edf96c9a7cc8be2a79983525b0f4cc9de8a21f289735a11c13 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_37-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fddcd7e01b404c67cff8af7811e1e8643ab7cde --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71a543a9fa28b374012ade70fa9937a0a46a70b8c6fd28ac7cf6a9a22eefd86 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_37-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ddb9369aec6e8d85a5bfc53a623e505e54ffda --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3dfe5b13e84e16616510be4c29622befbaab73778946b102e912220574da64 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_38-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d0875d5847159fae7c58d5e607de678075011c --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d87df86f93fbc13ba480bc237778152f7797a1473304afcb0a7e5e964884b8 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_38-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44e26dbea1b9ee6a4386ee8f7b013bbfe87d00c1 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea6e3464db6960275510db010e5dc5066a24b94f106a86a8e898bf4a79624f7 +size 113308931 diff --git a/4b284b42bc4seed1/global_step80108/layer_40-model_00-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6bfcdfca33efc6b7ed8996b354fce3e1fe44182 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e730252303f2814b9adc32b8f50e89e45954ced49771d380c138e7dbc68ff1 +size 13507 diff --git a/4b284b42bc4seed1/global_step80108/layer_40-model_01-model_states.pt b/4b284b42bc4seed1/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05e080db08a02dbf7b0cb1ee446d07225b60d72f --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bceda07eba8945c75c3e960f8249589bc9561d04f6f5872f385e1c88ebaf583 +size 13507 diff --git a/4b284b42bc4seed1/global_step80108/mp_rank_00_model_states.pt b/4b284b42bc4seed1/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f89fb00bf970e6ce1cd579ffea809ea07a4e4835 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93267cf547784f9afe74c63f2fbf2ce94e1b7942872db24dcc341ae4c8003a42 +size 51507 diff --git a/4b284b42bc4seed1/global_step80108/mp_rank_01_model_states.pt b/4b284b42bc4seed1/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad79d05dfbb8f63460bc774ff88bd7a07819c521 --- /dev/null +++ b/4b284b42bc4seed1/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f886cf9f68194b04f15bdafa372b631a3d10f8b3f32868b24239577193ae07 +size 51507 diff --git a/4b284b42bc4seed1/transformers/config.json b/4b284b42bc4seed1/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b42bc4seed1/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b42bc4seed1/transformers/pytorch_model.bin b/4b284b42bc4seed1/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7ee824f096777f6c2ac04d1ca2a34efe8ec6f8b --- /dev/null +++ b/4b284b42bc4seed1/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1356150e931ac1051691d9d834dc851cecf2238562ed1d3a5376cff85c95b8 +size 8781203669