diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..cfa1c7fca41a74f0a32e663f9cb2172c6a04c0b3 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.339,0.01497675877162034,0 +anli_r2,acc,0.335,0.014933117490932573,0 +anli_r3,acc,0.33416666666666667,0.013622434813136783,0 +arc_challenge,acc,0.17918088737201365,0.011207045216615674,0 +arc_challenge,acc_norm,0.2235494880546075,0.012174896631202614,0 +arc_easy,acc,0.4335016835016835,0.010168640625454107,0 +arc_easy,acc_norm,0.3846801346801347,0.009983171707009006,0 +boolq,acc,0.5938837920489297,0.008589510943787407,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.1940928270042194,,1 +copa,acc,0.62,0.04878317312145632,0 +hellaswag,acc,0.2951603266281617,0.004551826272978059,0 +hellaswag,acc_norm,0.3241386178052181,0.004670955399641126,0 +piqa,acc,0.6218715995647442,0.011313980666854535,0 +piqa,acc_norm,0.6267682263329706,0.011284653078254898,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.732,0.01401329270272948,0 +sciq,acc_norm,0.669,0.01488827258820394,0 +storycloze_2016,acc,0.5873864243719936,0.011384472322969045,0 +winogrande,acc,0.5059194948697711,0.01405150083848581,0 diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4787b77bb86307c49c89dabe9cf2e2580bef0577 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.01497675877162034 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r3": { + "acc": 0.33416666666666667, + "acc_stderr": 0.013622434813136783 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145632 + }, + "hellaswag": { + "acc": 0.2951603266281617, + "acc_stderr": 0.004551826272978059, + "acc_norm": 0.3241386178052181, + "acc_norm_stderr": 0.004670955399641126 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5059194948697711, + "acc_stderr": 0.01405150083848581 + }, + "storycloze_2016": { + "acc": 0.5873864243719936, + "acc_stderr": 0.011384472322969045 + }, + "boolq": { + "acc": 0.5938837920489297, + "acc_stderr": 0.008589510943787407 + }, + "arc_easy": { + "acc": 0.4335016835016835, + "acc_stderr": 0.010168640625454107, + "acc_norm": 0.3846801346801347, + "acc_norm_stderr": 0.009983171707009006 + }, + "arc_challenge": { + "acc": 0.17918088737201365, + "acc_stderr": 0.011207045216615674, + "acc_norm": 0.2235494880546075, + "acc_norm_stderr": 0.012174896631202614 + }, + "sciq": { + "acc": 0.732, + "acc_stderr": 0.01401329270272948, + "acc_norm": 0.669, + "acc_norm_stderr": 0.01488827258820394 + }, + "piqa": { + "acc": 0.6218715995647442, + "acc_stderr": 0.011313980666854535, + "acc_norm": 0.6267682263329706, + "acc_norm_stderr": 0.011284653078254898 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-23-24-23_0shots_backup.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-23-24-23_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..4787b77bb86307c49c89dabe9cf2e2580bef0577 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-23-24-23_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.01497675877162034 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r3": { + "acc": 0.33416666666666667, + "acc_stderr": 0.013622434813136783 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145632 + }, + "hellaswag": { + "acc": 0.2951603266281617, + "acc_stderr": 0.004551826272978059, + "acc_norm": 0.3241386178052181, + "acc_norm_stderr": 0.004670955399641126 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5059194948697711, + "acc_stderr": 0.01405150083848581 + }, + "storycloze_2016": { + "acc": 0.5873864243719936, + "acc_stderr": 0.011384472322969045 + }, + "boolq": { + "acc": 0.5938837920489297, + "acc_stderr": 0.008589510943787407 + }, + "arc_easy": { + "acc": 0.4335016835016835, + "acc_stderr": 0.010168640625454107, + "acc_norm": 0.3846801346801347, + "acc_norm_stderr": 0.009983171707009006 + }, + "arc_challenge": { + "acc": 0.17918088737201365, + "acc_stderr": 0.011207045216615674, + "acc_norm": 0.2235494880546075, + "acc_norm_stderr": 0.012174896631202614 + }, + "sciq": { + "acc": 0.732, + "acc_stderr": 0.01401329270272948, + "acc_norm": 0.669, + "acc_norm_stderr": 0.01488827258820394 + }, + "piqa": { + "acc": 0.6218715995647442, + "acc_stderr": 0.011313980666854535, + "acc_norm": 0.6267682263329706, + "acc_norm_stderr": 0.011284653078254898 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b4d06d30560902ae2fec5931f71e812459296557 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.36, + "acc_stderr": 0.015186527932040122 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563102 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.01349009528298952 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.28651292802236195 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.048241815132442176 + }, + "hellaswag": { + "acc": 0.2913762198765186, + "acc_stderr": 0.004534677750102734, + "acc_norm": 0.3249352718581956, + "acc_norm_stderr": 0.0046739348371504464 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.494869771112865, + "acc_stderr": 0.014051745961790513 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.01141582799434265 + }, + "boolq": { + "acc": 0.5110091743119266, + "acc_stderr": 0.008742934884517647 + }, + "arc_easy": { + "acc": 0.4297138047138047, + "acc_stderr": 0.010157908005763678, + "acc_norm": 0.3792087542087542, + "acc_norm_stderr": 0.00995589166886556 + }, + "arc_challenge": { + "acc": 0.1825938566552901, + "acc_stderr": 0.011289730684564982, + "acc_norm": 0.21928327645051193, + "acc_norm_stderr": 0.012091245787615734 + }, + "sciq": { + "acc": 0.705, + "acc_stderr": 0.014428554438445517, + "acc_norm": 0.658, + "acc_norm_stderr": 0.015008706182121731 + }, + "piqa": { + "acc": 0.6218715995647442, + "acc_stderr": 0.011313980666854535, + "acc_norm": 0.6109902067464635, + "acc_norm_stderr": 0.011374774974447464 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-23-24-23_1shots_backup.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-23-24-23_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b4d06d30560902ae2fec5931f71e812459296557 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-23-24-23_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.36, + "acc_stderr": 0.015186527932040122 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563102 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.01349009528298952 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.28651292802236195 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.048241815132442176 + }, + "hellaswag": { + "acc": 0.2913762198765186, + "acc_stderr": 0.004534677750102734, + "acc_norm": 0.3249352718581956, + "acc_norm_stderr": 0.0046739348371504464 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.494869771112865, + "acc_stderr": 0.014051745961790513 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.01141582799434265 + }, + "boolq": { + "acc": 0.5110091743119266, + "acc_stderr": 0.008742934884517647 + }, + "arc_easy": { + "acc": 0.4297138047138047, + "acc_stderr": 0.010157908005763678, + "acc_norm": 0.3792087542087542, + "acc_norm_stderr": 0.00995589166886556 + }, + "arc_challenge": { + "acc": 0.1825938566552901, + "acc_stderr": 0.011289730684564982, + "acc_norm": 0.21928327645051193, + "acc_norm_stderr": 0.012091245787615734 + }, + "sciq": { + "acc": 0.705, + "acc_stderr": 0.014428554438445517, + "acc_norm": 0.658, + "acc_norm_stderr": 0.015008706182121731 + }, + "piqa": { + "acc": 0.6218715995647442, + "acc_stderr": 0.011313980666854535, + "acc_norm": 0.6109902067464635, + "acc_norm_stderr": 0.011374774974447464 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json new file mode 100644 index 0000000000000000000000000000000000000000..54d1b531d25ed098ed5bfa29b4e4b8c926cba0f5 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.311, + "acc_stderr": 0.014645596385722695 + }, + "anli_r2": { + "acc": 0.356, + "acc_stderr": 0.015149042659306625 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.01364760294240639 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.316548463356974 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.048523658709391 + }, + "hellaswag": { + "acc": 0.29047998406691894, + "acc_stderr": 0.004530560646902538, + "acc_norm": 0.3179645488946425, + "acc_norm_stderr": 0.004647338877642189 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5098658247829518, + "acc_stderr": 0.014049749833367596 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342655 + }, + "boolq": { + "acc": 0.4746177370030581, + "acc_stderr": 0.008733779541853504 + }, + "arc_easy": { + "acc": 0.42297979797979796, + "acc_stderr": 0.010137328382209104, + "acc_norm": 0.39057239057239057, + "acc_norm_stderr": 0.010011059112064229 + }, + "arc_challenge": { + "acc": 0.18515358361774745, + "acc_stderr": 0.011350774438389699, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.01220783999540731 + }, + "sciq": { + "acc": 0.727, + "acc_stderr": 0.014095022868717607, + "acc_norm": 0.677, + "acc_norm_stderr": 0.014794927843348635 + }, + "piqa": { + "acc": 0.6316648531011969, + "acc_stderr": 0.011254089354334373, + "acc_norm": 0.6294885745375408, + "acc_norm_stderr": 0.01126782647544766 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-23-24-23_2shots_backup.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-23-24-23_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..54d1b531d25ed098ed5bfa29b4e4b8c926cba0f5 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-23-24-23_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.311, + "acc_stderr": 0.014645596385722695 + }, + "anli_r2": { + "acc": 0.356, + "acc_stderr": 0.015149042659306625 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.01364760294240639 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.316548463356974 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.048523658709391 + }, + "hellaswag": { + "acc": 0.29047998406691894, + "acc_stderr": 0.004530560646902538, + "acc_norm": 0.3179645488946425, + "acc_norm_stderr": 0.004647338877642189 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5098658247829518, + "acc_stderr": 0.014049749833367596 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342655 + }, + "boolq": { + "acc": 0.4746177370030581, + "acc_stderr": 0.008733779541853504 + }, + "arc_easy": { + "acc": 0.42297979797979796, + "acc_stderr": 0.010137328382209104, + "acc_norm": 0.39057239057239057, + "acc_norm_stderr": 0.010011059112064229 + }, + "arc_challenge": { + "acc": 0.18515358361774745, + "acc_stderr": 0.011350774438389699, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.01220783999540731 + }, + "sciq": { + "acc": 0.727, + "acc_stderr": 0.014095022868717607, + "acc_norm": 0.677, + "acc_norm_stderr": 0.014794927843348635 + }, + "piqa": { + "acc": 0.6316648531011969, + "acc_stderr": 0.011254089354334373, + "acc_norm": 0.6294885745375408, + "acc_norm_stderr": 0.01126782647544766 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json new file mode 100644 index 0000000000000000000000000000000000000000..cda6bb6c71edde06caad623a0f455b1977193eb7 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.312, + "acc_stderr": 0.014658474370509008 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408947 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934725 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.3422885572139303 + }, + "copa": { + "acc": 0.6, + "acc_stderr": 0.049236596391733084 + }, + "hellaswag": { + "acc": 0.291575383389763, + "acc_stderr": 0.004535589759202657, + "acc_norm": 0.32284405496912966, + "acc_norm_stderr": 0.004666080865179641 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529015 + }, + "storycloze_2016": { + "acc": 0.5740245857830037, + "acc_stderr": 0.011435014262181197 + }, + "boolq": { + "acc": 0.4688073394495413, + "acc_stderr": 0.008728020822889253 + }, + "arc_easy": { + "acc": 0.42424242424242425, + "acc_stderr": 0.010141333654958574, + "acc_norm": 0.38425925925925924, + "acc_norm_stderr": 0.009981120724601443 + }, + "arc_challenge": { + "acc": 0.18686006825938567, + "acc_stderr": 0.011391015649694391, + "acc_norm": 0.22440273037542663, + "acc_norm_stderr": 0.012191404938603838 + }, + "sciq": { + "acc": 0.723, + "acc_stderr": 0.014158794845306265, + "acc_norm": 0.682, + "acc_norm_stderr": 0.014734079309311901 + }, + "piqa": { + "acc": 0.6284004352557128, + "acc_stderr": 0.011274603006724743, + "acc_norm": 0.6196953210010882, + "acc_norm_stderr": 0.011326620892570314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-23-24-23_3shots_backup.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-23-24-23_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..cda6bb6c71edde06caad623a0f455b1977193eb7 --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-23-24-23_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.312, + "acc_stderr": 0.014658474370509008 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408947 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934725 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.3422885572139303 + }, + "copa": { + "acc": 0.6, + "acc_stderr": 0.049236596391733084 + }, + "hellaswag": { + "acc": 0.291575383389763, + "acc_stderr": 0.004535589759202657, + "acc_norm": 0.32284405496912966, + "acc_norm_stderr": 0.004666080865179641 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529015 + }, + "storycloze_2016": { + "acc": 0.5740245857830037, + "acc_stderr": 0.011435014262181197 + }, + "boolq": { + "acc": 0.4688073394495413, + "acc_stderr": 0.008728020822889253 + }, + "arc_easy": { + "acc": 0.42424242424242425, + "acc_stderr": 0.010141333654958574, + "acc_norm": 0.38425925925925924, + "acc_norm_stderr": 0.009981120724601443 + }, + "arc_challenge": { + "acc": 0.18686006825938567, + "acc_stderr": 0.011391015649694391, + "acc_norm": 0.22440273037542663, + "acc_norm_stderr": 0.012191404938603838 + }, + "sciq": { + "acc": 0.723, + "acc_stderr": 0.014158794845306265, + "acc_norm": 0.682, + "acc_norm_stderr": 0.014734079309311901 + }, + "piqa": { + "acc": 0.6284004352557128, + "acc_stderr": 0.011274603006724743, + "acc_norm": 0.6196953210010882, + "acc_norm_stderr": 0.011326620892570314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json new file mode 100644 index 0000000000000000000000000000000000000000..3310b4b93a3c4ab25fd46b741a790e4dd0a3062d --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795025 + }, + "anli_r2": { + "acc": 0.352, + "acc_stderr": 0.01511040450564867 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618266 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644645, + "f1": 0.3362023995826813 + }, + "copa": { + "acc": 0.6, + "acc_stderr": 0.049236596391733084 + }, + "hellaswag": { + "acc": 0.29645488946425014, + "acc_stderr": 0.004557606227194286, + "acc_norm": 0.3234415455088628, + "acc_norm_stderr": 0.004668335725410298 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.4877663772691397, + "acc_stderr": 0.01404827882040562 + }, + "storycloze_2016": { + "acc": 0.5788348476750401, + "acc_stderr": 0.011417808278216117 + }, + "boolq": { + "acc": 0.44434250764525995, + "acc_stderr": 0.00869070599067338 + }, + "arc_easy": { + "acc": 0.42845117845117847, + "acc_stderr": 0.010154195733990975, + "acc_norm": 0.3930976430976431, + "acc_norm_stderr": 0.010022540618945312 + }, + "arc_challenge": { + "acc": 0.1962457337883959, + "acc_stderr": 0.01160601988141629, + "acc_norm": 0.22781569965870307, + "acc_norm_stderr": 0.012256708602326905 + }, + "sciq": { + "acc": 0.719, + "acc_stderr": 0.014221154708434929, + "acc_norm": 0.686, + "acc_norm_stderr": 0.014683991951087967 + }, + "piqa": { + "acc": 0.6273122959738846, + "acc_stderr": 0.01128131833289774, + "acc_norm": 0.6169749727965179, + "acc_norm_stderr": 0.01134208170908285 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-23-24-23_4shots_backup.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-23-24-23_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..3310b4b93a3c4ab25fd46b741a790e4dd0a3062d --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-23-24-23_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795025 + }, + "anli_r2": { + "acc": 0.352, + "acc_stderr": 0.01511040450564867 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618266 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644645, + "f1": 0.3362023995826813 + }, + "copa": { + "acc": 0.6, + "acc_stderr": 0.049236596391733084 + }, + "hellaswag": { + "acc": 0.29645488946425014, + "acc_stderr": 0.004557606227194286, + "acc_norm": 0.3234415455088628, + "acc_norm_stderr": 0.004668335725410298 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.4877663772691397, + "acc_stderr": 0.01404827882040562 + }, + "storycloze_2016": { + "acc": 0.5788348476750401, + "acc_stderr": 0.011417808278216117 + }, + "boolq": { + "acc": 0.44434250764525995, + "acc_stderr": 0.00869070599067338 + }, + "arc_easy": { + "acc": 0.42845117845117847, + "acc_stderr": 0.010154195733990975, + "acc_norm": 0.3930976430976431, + "acc_norm_stderr": 0.010022540618945312 + }, + "arc_challenge": { + "acc": 0.1962457337883959, + "acc_stderr": 0.01160601988141629, + "acc_norm": 0.22781569965870307, + "acc_norm_stderr": 0.012256708602326905 + }, + "sciq": { + "acc": 0.719, + "acc_stderr": 0.014221154708434929, + "acc_norm": 0.686, + "acc_norm_stderr": 0.014683991951087967 + }, + "piqa": { + "acc": 0.6273122959738846, + "acc_stderr": 0.01128131833289774, + "acc_norm": 0.6169749727965179, + "acc_norm_stderr": 0.01134208170908285 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6183ecc6adfaacbb1093450e1eb3d28dab4f02dd --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.375, + "acc_stderr": 0.015316971293620996 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.01368860079329693 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3464373464373464 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29486158135829516, + "acc_stderr": 0.0045504861860190746, + "acc_norm": 0.32304321848237405, + "acc_norm_stderr": 0.0046668334527961925 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5027624309392266, + "acc_stderr": 0.014052271211616441 + }, + "storycloze_2016": { + "acc": 0.5809727418492785, + "acc_stderr": 0.011409804749706194 + }, + "boolq": { + "acc": 0.44128440366972477, + "acc_stderr": 0.008684548127832634 + }, + "arc_easy": { + "acc": 0.4297138047138047, + "acc_stderr": 0.010157908005763676, + "acc_norm": 0.3985690235690236, + "acc_norm_stderr": 0.010046455400477931 + }, + "arc_challenge": { + "acc": 0.19197952218430034, + "acc_stderr": 0.011509598906598112, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.012207839995407303 + }, + "sciq": { + "acc": 0.721, + "acc_stderr": 0.014190150117612032, + "acc_norm": 0.682, + "acc_norm_stderr": 0.014734079309311901 + }, + "piqa": { + "acc": 0.6305767138193689, + "acc_stderr": 0.011260988628572347, + "acc_norm": 0.6180631120783461, + "acc_norm_stderr": 0.011335942557505228 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-23-24-23_5shots_backup.json b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-23-24-23_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..6183ecc6adfaacbb1093450e1eb3d28dab4f02dd --- /dev/null +++ b/evaluation/rankeval_r_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-23-24-23_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.375, + "acc_stderr": 0.015316971293620996 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.01368860079329693 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3464373464373464 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29486158135829516, + "acc_stderr": 0.0045504861860190746, + "acc_norm": 0.32304321848237405, + "acc_norm_stderr": 0.0046668334527961925 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5027624309392266, + "acc_stderr": 0.014052271211616441 + }, + "storycloze_2016": { + "acc": 0.5809727418492785, + "acc_stderr": 0.011409804749706194 + }, + "boolq": { + "acc": 0.44128440366972477, + "acc_stderr": 0.008684548127832634 + }, + "arc_easy": { + "acc": 0.4297138047138047, + "acc_stderr": 0.010157908005763676, + "acc_norm": 0.3985690235690236, + "acc_norm_stderr": 0.010046455400477931 + }, + "arc_challenge": { + "acc": 0.19197952218430034, + "acc_stderr": 0.011509598906598112, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.012207839995407303 + }, + "sciq": { + "acc": 0.721, + "acc_stderr": 0.014190150117612032, + "acc_norm": 0.682, + "acc_norm_stderr": 0.014734079309311901 + }, + "piqa": { + "acc": 0.6305767138193689, + "acc_stderr": 0.011260988628572347, + "acc_norm": 0.6180631120783461, + "acc_norm_stderr": 0.011335942557505228 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..535953ca78587982851d3c36dcc1f87c79f74a10 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.339,0.01497675877162034,0 +anli_r2,acc,0.336,0.014944140233795027,0 +anli_r3,acc,0.3358333333333333,0.01363926119093288,0 +arc_challenge,acc,0.1885665529010239,0.011430897647675803,0 +arc_challenge,acc_norm,0.22610921501706485,0.01222420209706328,0 +arc_easy,acc,0.43308080808080807,0.010167478013701799,0 +arc_easy,acc_norm,0.38173400673400676,0.009968648851839667,0 +boolq,acc,0.5944954128440367,0.008587459055441612,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.1940928270042194,,1 +copa,acc,0.63,0.04852365870939099,0 +hellaswag,acc,0.297450707030472,0.004562022467161891,0 +hellaswag,acc_norm,0.32374029077872934,0.004669459891917689,0 +piqa,acc,0.6158868335146899,0.011348160741479148,0 +piqa,acc_norm,0.6218715995647442,0.011313980666854533,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.735,0.013963164754809953,0 +sciq,acc_norm,0.668,0.014899597242811476,0 +storycloze_2016,acc,0.5905932656333511,0.01137105952719707,0 +winogrande,acc,0.5090765588003157,0.014050170094497707,0 diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4abedd92cdcec31ddf28e8290eaec20bbc61ebc9 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.01497675877162034 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.01363926119093288 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.04852365870939099 + }, + "hellaswag": { + "acc": 0.297450707030472, + "acc_stderr": 0.004562022467161891, + "acc_norm": 0.32374029077872934, + "acc_norm_stderr": 0.004669459891917689 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5090765588003157, + "acc_stderr": 0.014050170094497707 + }, + "storycloze_2016": { + "acc": 0.5905932656333511, + "acc_stderr": 0.01137105952719707 + }, + "boolq": { + "acc": 0.5944954128440367, + "acc_stderr": 0.008587459055441612 + }, + "arc_easy": { + "acc": 0.43308080808080807, + "acc_stderr": 0.010167478013701799, + "acc_norm": 0.38173400673400676, + "acc_norm_stderr": 0.009968648851839667 + }, + "arc_challenge": { + "acc": 0.1885665529010239, + "acc_stderr": 0.011430897647675803, + "acc_norm": 0.22610921501706485, + "acc_norm_stderr": 0.01222420209706328 + }, + "sciq": { + "acc": 0.735, + "acc_stderr": 0.013963164754809953, + "acc_norm": 0.668, + "acc_norm_stderr": 0.014899597242811476 + }, + "piqa": { + "acc": 0.6158868335146899, + "acc_stderr": 0.011348160741479148, + "acc_norm": 0.6218715995647442, + "acc_norm_stderr": 0.011313980666854533 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-17-38-12_0shots_backup.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-17-38-12_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..4abedd92cdcec31ddf28e8290eaec20bbc61ebc9 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-17-38-12_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.01497675877162034 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795027 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.01363926119093288 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.04852365870939099 + }, + "hellaswag": { + "acc": 0.297450707030472, + "acc_stderr": 0.004562022467161891, + "acc_norm": 0.32374029077872934, + "acc_norm_stderr": 0.004669459891917689 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5090765588003157, + "acc_stderr": 0.014050170094497707 + }, + "storycloze_2016": { + "acc": 0.5905932656333511, + "acc_stderr": 0.01137105952719707 + }, + "boolq": { + "acc": 0.5944954128440367, + "acc_stderr": 0.008587459055441612 + }, + "arc_easy": { + "acc": 0.43308080808080807, + "acc_stderr": 0.010167478013701799, + "acc_norm": 0.38173400673400676, + "acc_norm_stderr": 0.009968648851839667 + }, + "arc_challenge": { + "acc": 0.1885665529010239, + "acc_stderr": 0.011430897647675803, + "acc_norm": 0.22610921501706485, + "acc_norm_stderr": 0.01222420209706328 + }, + "sciq": { + "acc": 0.735, + "acc_stderr": 0.013963164754809953, + "acc_norm": 0.668, + "acc_norm_stderr": 0.014899597242811476 + }, + "piqa": { + "acc": 0.6158868335146899, + "acc_stderr": 0.011348160741479148, + "acc_norm": 0.6218715995647442, + "acc_norm_stderr": 0.011313980666854533 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1225e180862c365265004aeda1aa6084da376a1f --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.358, + "acc_stderr": 0.015167928865407559 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444236 + }, + "anli_r3": { + "acc": 0.32, + "acc_stderr": 0.013471620929769152 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.28651292802236195 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.04688261722621504 + }, + "hellaswag": { + "acc": 0.2930691097390958, + "acc_stderr": 0.004542396269999213, + "acc_norm": 0.3207528380800637, + "acc_norm_stderr": 0.004658120152230808 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.02985524739031495 + }, + "winogrande": { + "acc": 0.4964483030781373, + "acc_stderr": 0.01405213114691586 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.01141582799434265 + }, + "boolq": { + "acc": 0.5125382262996941, + "acc_stderr": 0.008742304974218311 + }, + "arc_easy": { + "acc": 0.4313973063973064, + "acc_stderr": 0.010162752847747498, + "acc_norm": 0.38341750841750843, + "acc_norm_stderr": 0.009976995068264717 + }, + "arc_challenge": { + "acc": 0.19027303754266212, + "acc_stderr": 0.011470424179225709, + "acc_norm": 0.22610921501706485, + "acc_norm_stderr": 0.012224202097063274 + }, + "sciq": { + "acc": 0.704, + "acc_stderr": 0.014442734941575022, + "acc_norm": 0.658, + "acc_norm_stderr": 0.015008706182121731 + }, + "piqa": { + "acc": 0.6240478781284005, + "acc_stderr": 0.011301098166895732, + "acc_norm": 0.6158868335146899, + "acc_norm_stderr": 0.011348160741479136 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-17-38-12_1shots_backup.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-17-38-12_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1225e180862c365265004aeda1aa6084da376a1f --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-17-38-12_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.358, + "acc_stderr": 0.015167928865407559 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444236 + }, + "anli_r3": { + "acc": 0.32, + "acc_stderr": 0.013471620929769152 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.28651292802236195 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.04688261722621504 + }, + "hellaswag": { + "acc": 0.2930691097390958, + "acc_stderr": 0.004542396269999213, + "acc_norm": 0.3207528380800637, + "acc_norm_stderr": 0.004658120152230808 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.02985524739031495 + }, + "winogrande": { + "acc": 0.4964483030781373, + "acc_stderr": 0.01405213114691586 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.01141582799434265 + }, + "boolq": { + "acc": 0.5125382262996941, + "acc_stderr": 0.008742304974218311 + }, + "arc_easy": { + "acc": 0.4313973063973064, + "acc_stderr": 0.010162752847747498, + "acc_norm": 0.38341750841750843, + "acc_norm_stderr": 0.009976995068264717 + }, + "arc_challenge": { + "acc": 0.19027303754266212, + "acc_stderr": 0.011470424179225709, + "acc_norm": 0.22610921501706485, + "acc_norm_stderr": 0.012224202097063274 + }, + "sciq": { + "acc": 0.704, + "acc_stderr": 0.014442734941575022, + "acc_norm": 0.658, + "acc_norm_stderr": 0.015008706182121731 + }, + "piqa": { + "acc": 0.6240478781284005, + "acc_stderr": 0.011301098166895732, + "acc_norm": 0.6158868335146899, + "acc_norm_stderr": 0.011348160741479136 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json new file mode 100644 index 0000000000000000000000000000000000000000..35ed6c0b7155736172eed409d075c56cc12843c6 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.308, + "acc_stderr": 0.014606483127342763 + }, + "anli_r2": { + "acc": 0.353, + "acc_stderr": 0.015120172605483696 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463653 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.316548463356974 + }, + "copa": { + "acc": 0.61, + "acc_stderr": 0.04902071300001975 + }, + "hellaswag": { + "acc": 0.2929695279824736, + "acc_stderr": 0.004541944342035901, + "acc_norm": 0.31866162119099783, + "acc_norm_stderr": 0.00465005215009441 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529012 + }, + "storycloze_2016": { + "acc": 0.5836451095670764, + "acc_stderr": 0.011399490926937005 + }, + "boolq": { + "acc": 0.4776758409785933, + "acc_stderr": 0.00873633411558504 + }, + "arc_easy": { + "acc": 0.42634680134680136, + "acc_stderr": 0.010147858603835139, + "acc_norm": 0.3926767676767677, + "acc_norm_stderr": 0.010020646555538686 + }, + "arc_challenge": { + "acc": 0.18344709897610922, + "acc_stderr": 0.011310170179554543, + "acc_norm": 0.22696245733788395, + "acc_norm_stderr": 0.012240491536132879 + }, + "sciq": { + "acc": 0.73, + "acc_stderr": 0.014046255632633915, + "acc_norm": 0.677, + "acc_norm_stderr": 0.014794927843348633 + }, + "piqa": { + "acc": 0.6349292709466812, + "acc_stderr": 0.011233021830554829, + "acc_norm": 0.6251360174102285, + "acc_norm_stderr": 0.011294565805619019 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-17-36-57_2shots_backup.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-17-36-57_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..35ed6c0b7155736172eed409d075c56cc12843c6 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-17-36-57_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.308, + "acc_stderr": 0.014606483127342763 + }, + "anli_r2": { + "acc": 0.353, + "acc_stderr": 0.015120172605483696 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463653 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.316548463356974 + }, + "copa": { + "acc": 0.61, + "acc_stderr": 0.04902071300001975 + }, + "hellaswag": { + "acc": 0.2929695279824736, + "acc_stderr": 0.004541944342035901, + "acc_norm": 0.31866162119099783, + "acc_norm_stderr": 0.00465005215009441 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529012 + }, + "storycloze_2016": { + "acc": 0.5836451095670764, + "acc_stderr": 0.011399490926937005 + }, + "boolq": { + "acc": 0.4776758409785933, + "acc_stderr": 0.00873633411558504 + }, + "arc_easy": { + "acc": 0.42634680134680136, + "acc_stderr": 0.010147858603835139, + "acc_norm": 0.3926767676767677, + "acc_norm_stderr": 0.010020646555538686 + }, + "arc_challenge": { + "acc": 0.18344709897610922, + "acc_stderr": 0.011310170179554543, + "acc_norm": 0.22696245733788395, + "acc_norm_stderr": 0.012240491536132879 + }, + "sciq": { + "acc": 0.73, + "acc_stderr": 0.014046255632633915, + "acc_norm": 0.677, + "acc_norm_stderr": 0.014794927843348633 + }, + "piqa": { + "acc": 0.6349292709466812, + "acc_stderr": 0.011233021830554829, + "acc_norm": 0.6251360174102285, + "acc_norm_stderr": 0.011294565805619019 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0d6363f2285674bac47e6f5331b217f8031ab121 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402704 + }, + "anli_r3": { + "acc": 0.3466666666666667, + "acc_stderr": 0.013744022550571949 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.347985347985348 + }, + "copa": { + "acc": 0.59, + "acc_stderr": 0.04943110704237101 + }, + "hellaswag": { + "acc": 0.2953594901414061, + "acc_stderr": 0.004552718360513099, + "acc_norm": 0.3241386178052181, + "acc_norm_stderr": 0.0046709553996411276 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.494869771112865, + "acc_stderr": 0.014051745961790513 + }, + "storycloze_2016": { + "acc": 0.5788348476750401, + "acc_stderr": 0.011417808278216117 + }, + "boolq": { + "acc": 0.4694189602446483, + "acc_stderr": 0.008728682900189723 + }, + "arc_easy": { + "acc": 0.4276094276094276, + "acc_stderr": 0.010151683397430679, + "acc_norm": 0.39141414141414144, + "acc_norm_stderr": 0.010014917532627812 + }, + "arc_challenge": { + "acc": 0.19027303754266212, + "acc_stderr": 0.011470424179225698, + "acc_norm": 0.2235494880546075, + "acc_norm_stderr": 0.012174896631202607 + }, + "sciq": { + "acc": 0.716, + "acc_stderr": 0.014267009061031314, + "acc_norm": 0.679, + "acc_norm_stderr": 0.014770821817934645 + }, + "piqa": { + "acc": 0.6289445048966268, + "acc_stderr": 0.011271222398600525, + "acc_norm": 0.6202393906420022, + "acc_norm_stderr": 0.011323483504715843 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-17-36-57_3shots_backup.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-17-36-57_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0d6363f2285674bac47e6f5331b217f8031ab121 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-17-36-57_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402704 + }, + "anli_r3": { + "acc": 0.3466666666666667, + "acc_stderr": 0.013744022550571949 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.347985347985348 + }, + "copa": { + "acc": 0.59, + "acc_stderr": 0.04943110704237101 + }, + "hellaswag": { + "acc": 0.2953594901414061, + "acc_stderr": 0.004552718360513099, + "acc_norm": 0.3241386178052181, + "acc_norm_stderr": 0.0046709553996411276 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.494869771112865, + "acc_stderr": 0.014051745961790513 + }, + "storycloze_2016": { + "acc": 0.5788348476750401, + "acc_stderr": 0.011417808278216117 + }, + "boolq": { + "acc": 0.4694189602446483, + "acc_stderr": 0.008728682900189723 + }, + "arc_easy": { + "acc": 0.4276094276094276, + "acc_stderr": 0.010151683397430679, + "acc_norm": 0.39141414141414144, + "acc_norm_stderr": 0.010014917532627812 + }, + "arc_challenge": { + "acc": 0.19027303754266212, + "acc_stderr": 0.011470424179225698, + "acc_norm": 0.2235494880546075, + "acc_norm_stderr": 0.012174896631202607 + }, + "sciq": { + "acc": 0.716, + "acc_stderr": 0.014267009061031314, + "acc_norm": 0.679, + "acc_norm_stderr": 0.014770821817934645 + }, + "piqa": { + "acc": 0.6289445048966268, + "acc_stderr": 0.011271222398600525, + "acc_norm": 0.6202393906420022, + "acc_norm_stderr": 0.011323483504715843 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json new file mode 100644 index 0000000000000000000000000000000000000000..3fb7e9f5bc215c037f7d36997a1507c959ea2966 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795025 + }, + "anli_r2": { + "acc": 0.353, + "acc_stderr": 0.01512017260548369 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.01365589718546366 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644645, + "f1": 0.3362023995826813 + }, + "copa": { + "acc": 0.6, + "acc_stderr": 0.04923659639173309 + }, + "hellaswag": { + "acc": 0.2938657637920733, + "acc_stderr": 0.004546002255456781, + "acc_norm": 0.32204740091615214, + "acc_norm_stderr": 0.00466306082837678 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.48303078137332284, + "acc_stderr": 0.014044390401612969 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342653 + }, + "boolq": { + "acc": 0.4437308868501529, + "acc_stderr": 0.008689501105367405 + }, + "arc_easy": { + "acc": 0.43013468013468015, + "acc_stderr": 0.010159130445178514, + "acc_norm": 0.39225589225589225, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.19795221843003413, + "acc_stderr": 0.011643990971573395, + "acc_norm": 0.23122866894197952, + "acc_norm_stderr": 0.012320858834772266 + }, + "sciq": { + "acc": 0.721, + "acc_stderr": 0.01419015011761203, + "acc_norm": 0.686, + "acc_norm_stderr": 0.014683991951087967 + }, + "piqa": { + "acc": 0.6322089227421109, + "acc_stderr": 0.011250616646678797, + "acc_norm": 0.6240478781284005, + "acc_norm_stderr": 0.011301098166895724 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-17-38-12_4shots_backup.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-17-38-12_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..3fb7e9f5bc215c037f7d36997a1507c959ea2966 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-17-38-12_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795025 + }, + "anli_r2": { + "acc": 0.353, + "acc_stderr": 0.01512017260548369 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.01365589718546366 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644645, + "f1": 0.3362023995826813 + }, + "copa": { + "acc": 0.6, + "acc_stderr": 0.04923659639173309 + }, + "hellaswag": { + "acc": 0.2938657637920733, + "acc_stderr": 0.004546002255456781, + "acc_norm": 0.32204740091615214, + "acc_norm_stderr": 0.00466306082837678 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.48303078137332284, + "acc_stderr": 0.014044390401612969 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342653 + }, + "boolq": { + "acc": 0.4437308868501529, + "acc_stderr": 0.008689501105367405 + }, + "arc_easy": { + "acc": 0.43013468013468015, + "acc_stderr": 0.010159130445178514, + "acc_norm": 0.39225589225589225, + "acc_norm_stderr": 0.010018744689650043 + }, + "arc_challenge": { + "acc": 0.19795221843003413, + "acc_stderr": 0.011643990971573395, + "acc_norm": 0.23122866894197952, + "acc_norm_stderr": 0.012320858834772266 + }, + "sciq": { + "acc": 0.721, + "acc_stderr": 0.01419015011761203, + "acc_norm": 0.686, + "acc_norm_stderr": 0.014683991951087967 + }, + "piqa": { + "acc": 0.6322089227421109, + "acc_stderr": 0.011250616646678797, + "acc_norm": 0.6240478781284005, + "acc_norm_stderr": 0.011301098166895724 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e6136f6b97356b8a97c5d72412fb4861e70d6380 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.368, + "acc_stderr": 0.015258073561521802 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932577 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002515 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3459575611066344 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.2944632543318064, + "acc_stderr": 0.00454869574962096, + "acc_norm": 0.32423819956184025, + "acc_norm_stderr": 0.0046713286732178 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.4972375690607735, + "acc_stderr": 0.014052271211616441 + }, + "storycloze_2016": { + "acc": 0.5836451095670764, + "acc_stderr": 0.011399490926937006 + }, + "boolq": { + "acc": 0.44128440366972477, + "acc_stderr": 0.008684548127832634 + }, + "arc_easy": { + "acc": 0.4297138047138047, + "acc_stderr": 0.010157908005763678, + "acc_norm": 0.39941077441077444, + "acc_norm_stderr": 0.010050018228742115 + }, + "arc_challenge": { + "acc": 0.19283276450511946, + "acc_stderr": 0.011529055465663338, + "acc_norm": 0.22696245733788395, + "acc_norm_stderr": 0.012240491536132873 + }, + "sciq": { + "acc": 0.717, + "acc_stderr": 0.014251810906481735, + "acc_norm": 0.68, + "acc_norm_stderr": 0.014758652303574883 + }, + "piqa": { + "acc": 0.6278563656147987, + "acc_stderr": 0.01127796831359274, + "acc_norm": 0.6207834602829162, + "acc_norm_stderr": 0.011320331012905077 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-17-38-12_5shots_backup.json b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-17-38-12_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..e6136f6b97356b8a97c5d72412fb4861e70d6380 --- /dev/null +++ b/evaluation/rankeval_s_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-17-38-12_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.368, + "acc_stderr": 0.015258073561521802 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932577 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002515 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3459575611066344 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.2944632543318064, + "acc_stderr": 0.00454869574962096, + "acc_norm": 0.32423819956184025, + "acc_norm_stderr": 0.0046713286732178 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.4972375690607735, + "acc_stderr": 0.014052271211616441 + }, + "storycloze_2016": { + "acc": 0.5836451095670764, + "acc_stderr": 0.011399490926937006 + }, + "boolq": { + "acc": 0.44128440366972477, + "acc_stderr": 0.008684548127832634 + }, + "arc_easy": { + "acc": 0.4297138047138047, + "acc_stderr": 0.010157908005763678, + "acc_norm": 0.39941077441077444, + "acc_norm_stderr": 0.010050018228742115 + }, + "arc_challenge": { + "acc": 0.19283276450511946, + "acc_stderr": 0.011529055465663338, + "acc_norm": 0.22696245733788395, + "acc_norm_stderr": 0.012240491536132873 + }, + "sciq": { + "acc": 0.717, + "acc_stderr": 0.014251810906481735, + "acc_norm": 0.68, + "acc_norm_stderr": 0.014758652303574883 + }, + "piqa": { + "acc": 0.6278563656147987, + "acc_stderr": 0.01127796831359274, + "acc_norm": 0.6207834602829162, + "acc_norm_stderr": 0.011320331012905077 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0.csv b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..1961804954bcf82e11ee8120c57cfe24e2416656 --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.333,0.014910846164229868,0 +anli_r2,acc,0.339,0.014976758771620344,0 +anli_r3,acc,0.33916666666666667,0.013672343491681819,0 +arc_challenge,acc,0.18600682593856654,0.011370940183266749,0 +arc_challenge,acc_norm,0.22610921501706485,0.01222420209706328,0 +arc_easy,acc,0.42003367003367004,0.010127718838529398,0 +arc_easy,acc_norm,0.3728956228956229,0.009922743197129255,0 +boolq,acc,0.6051987767584098,0.008549304887647411,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.1940928270042194,,1 +copa,acc,0.62,0.04878317312145632,0 +hellaswag,acc,0.2949611631149173,0.004550933142528753,0 +hellaswag,acc_norm,0.32463652658832903,0.004672819355838551,0 +piqa,acc,0.6251360174102285,0.011294565805619017,0 +piqa,acc_norm,0.6224156692056583,0.011310782787145772,0 +rte,acc,0.5342960288808665,0.030025579819366422,0 +sciq,acc,0.735,0.013963164754809949,0 +sciq,acc_norm,0.656,0.015029633724408945,0 +storycloze_2016,acc,0.5873864243719936,0.011384472322969045,0 +winogrande,acc,0.516179952644041,0.014045126130978601,0 diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0.json new file mode 100644 index 0000000000000000000000000000000000000000..91dacb78cd6246f324b5d0c5b28d77cf63cc725d --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.333, + "acc_stderr": 0.014910846164229868 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681819 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145632 + }, + "hellaswag": { + "acc": 0.2949611631149173, + "acc_stderr": 0.004550933142528753, + "acc_norm": 0.32463652658832903, + "acc_norm_stderr": 0.004672819355838551 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366422 + }, + "winogrande": { + "acc": 0.516179952644041, + "acc_stderr": 0.014045126130978601 + }, + "storycloze_2016": { + "acc": 0.5873864243719936, + "acc_stderr": 0.011384472322969045 + }, + "boolq": { + "acc": 0.6051987767584098, + "acc_stderr": 0.008549304887647411 + }, + "arc_easy": { + "acc": 0.42003367003367004, + "acc_stderr": 0.010127718838529398, + "acc_norm": 0.3728956228956229, + "acc_norm_stderr": 0.009922743197129255 + }, + "arc_challenge": { + "acc": 0.18600682593856654, + "acc_stderr": 0.011370940183266749, + "acc_norm": 0.22610921501706485, + "acc_norm_stderr": 0.01222420209706328 + }, + "sciq": { + "acc": 0.735, + "acc_stderr": 0.013963164754809949, + "acc_norm": 0.656, + "acc_norm_stderr": 0.015029633724408945 + }, + "piqa": { + "acc": 0.6251360174102285, + "acc_stderr": 0.011294565805619017, + "acc_norm": 0.6224156692056583, + "acc_norm_stderr": 0.011310782787145772 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step42000_2023-02-08-13-42-29_0shots_backup.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step42000_2023-02-08-13-42-29_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..91dacb78cd6246f324b5d0c5b28d77cf63cc725d --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step42000_2023-02-08-13-42-29_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.333, + "acc_stderr": 0.014910846164229868 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681819 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145632 + }, + "hellaswag": { + "acc": 0.2949611631149173, + "acc_stderr": 0.004550933142528753, + "acc_norm": 0.32463652658832903, + "acc_norm_stderr": 0.004672819355838551 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366422 + }, + "winogrande": { + "acc": 0.516179952644041, + "acc_stderr": 0.014045126130978601 + }, + "storycloze_2016": { + "acc": 0.5873864243719936, + "acc_stderr": 0.011384472322969045 + }, + "boolq": { + "acc": 0.6051987767584098, + "acc_stderr": 0.008549304887647411 + }, + "arc_easy": { + "acc": 0.42003367003367004, + "acc_stderr": 0.010127718838529398, + "acc_norm": 0.3728956228956229, + "acc_norm_stderr": 0.009922743197129255 + }, + "arc_challenge": { + "acc": 0.18600682593856654, + "acc_stderr": 0.011370940183266749, + "acc_norm": 0.22610921501706485, + "acc_norm_stderr": 0.01222420209706328 + }, + "sciq": { + "acc": 0.735, + "acc_stderr": 0.013963164754809949, + "acc_norm": 0.656, + "acc_norm_stderr": 0.015029633724408945 + }, + "piqa": { + "acc": 0.6251360174102285, + "acc_stderr": 0.011294565805619017, + "acc_norm": 0.6224156692056583, + "acc_norm_stderr": 0.011310782787145772 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_1.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1c229b3bc0d2590f424345659babe6f4d7dc99ee --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932575 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002505 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.2712571726656234 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.04793724854411019 + }, + "hellaswag": { + "acc": 0.29396534554869547, + "acc_stderr": 0.004546451825028366, + "acc_norm": 0.3170683130850428, + "acc_norm_stderr": 0.004643832742876639 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5067087608524072, + "acc_stderr": 0.014051220692330349 + }, + "storycloze_2016": { + "acc": 0.5783003741314805, + "acc_stderr": 0.011419774841868156 + }, + "boolq": { + "acc": 0.5587155963302752, + "acc_stderr": 0.008684548127832634 + }, + "arc_easy": { + "acc": 0.41203703703703703, + "acc_stderr": 0.010099765857562773, + "acc_norm": 0.3720538720538721, + "acc_norm_stderr": 0.009918187193096468 + }, + "arc_challenge": { + "acc": 0.181740614334471, + "acc_stderr": 0.011269198948880236, + "acc_norm": 0.2167235494880546, + "acc_norm_stderr": 0.012040156713481192 + }, + "sciq": { + "acc": 0.685, + "acc_stderr": 0.014696631960792492, + "acc_norm": 0.632, + "acc_norm_stderr": 0.0152580735615218 + }, + "piqa": { + "acc": 0.6294885745375408, + "acc_stderr": 0.011267826475447665, + "acc_norm": 0.6262241566920566, + "acc_norm_stderr": 0.011287972563201017 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step42000_2023-02-08-13-42-29_1shots_backup.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step42000_2023-02-08-13-42-29_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1c229b3bc0d2590f424345659babe6f4d7dc99ee --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step42000_2023-02-08-13-42-29_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932575 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002505 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.2712571726656234 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.04793724854411019 + }, + "hellaswag": { + "acc": 0.29396534554869547, + "acc_stderr": 0.004546451825028366, + "acc_norm": 0.3170683130850428, + "acc_norm_stderr": 0.004643832742876639 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5067087608524072, + "acc_stderr": 0.014051220692330349 + }, + "storycloze_2016": { + "acc": 0.5783003741314805, + "acc_stderr": 0.011419774841868156 + }, + "boolq": { + "acc": 0.5587155963302752, + "acc_stderr": 0.008684548127832634 + }, + "arc_easy": { + "acc": 0.41203703703703703, + "acc_stderr": 0.010099765857562773, + "acc_norm": 0.3720538720538721, + "acc_norm_stderr": 0.009918187193096468 + }, + "arc_challenge": { + "acc": 0.181740614334471, + "acc_stderr": 0.011269198948880236, + "acc_norm": 0.2167235494880546, + "acc_norm_stderr": 0.012040156713481192 + }, + "sciq": { + "acc": 0.685, + "acc_stderr": 0.014696631960792492, + "acc_norm": 0.632, + "acc_norm_stderr": 0.0152580735615218 + }, + "piqa": { + "acc": 0.6294885745375408, + "acc_stderr": 0.011267826475447665, + "acc_norm": 0.6262241566920566, + "acc_norm_stderr": 0.011287972563201017 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_2.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b7f200cfd906081bd84a5f0681e7264cecdb6caa --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.313, + "acc_stderr": 0.014671272822977892 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934732 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2791044776119403 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.2887870942043418, + "acc_stderr": 0.004522725412556968, + "acc_norm": 0.31517625970922125, + "acc_norm_stderr": 0.004636365534819762 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529012 + }, + "storycloze_2016": { + "acc": 0.5809727418492785, + "acc_stderr": 0.011409804749706194 + }, + "boolq": { + "acc": 0.5483180428134556, + "acc_stderr": 0.008704126206159355 + }, + "arc_easy": { + "acc": 0.398989898989899, + "acc_stderr": 0.010048240683798759, + "acc_norm": 0.36784511784511786, + "acc_norm_stderr": 0.009894923464455196 + }, + "arc_challenge": { + "acc": 0.18515358361774745, + "acc_stderr": 0.011350774438389695, + "acc_norm": 0.22781569965870307, + "acc_norm_stderr": 0.012256708602326914 + }, + "sciq": { + "acc": 0.717, + "acc_stderr": 0.014251810906481735, + "acc_norm": 0.634, + "acc_norm_stderr": 0.015240612726405756 + }, + "piqa": { + "acc": 0.6327529923830251, + "acc_stderr": 0.011247128539690563, + "acc_norm": 0.6175190424374319, + "acc_norm_stderr": 0.011339019654272345 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step42000_2023-02-08-13-42-29_2shots_backup.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step42000_2023-02-08-13-42-29_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b7f200cfd906081bd84a5f0681e7264cecdb6caa --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step42000_2023-02-08-13-42-29_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.313, + "acc_stderr": 0.014671272822977892 + }, + "anli_r2": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934732 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2791044776119403 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.2887870942043418, + "acc_stderr": 0.004522725412556968, + "acc_norm": 0.31517625970922125, + "acc_norm_stderr": 0.004636365534819762 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529012 + }, + "storycloze_2016": { + "acc": 0.5809727418492785, + "acc_stderr": 0.011409804749706194 + }, + "boolq": { + "acc": 0.5483180428134556, + "acc_stderr": 0.008704126206159355 + }, + "arc_easy": { + "acc": 0.398989898989899, + "acc_stderr": 0.010048240683798759, + "acc_norm": 0.36784511784511786, + "acc_norm_stderr": 0.009894923464455196 + }, + "arc_challenge": { + "acc": 0.18515358361774745, + "acc_stderr": 0.011350774438389695, + "acc_norm": 0.22781569965870307, + "acc_norm_stderr": 0.012256708602326914 + }, + "sciq": { + "acc": 0.717, + "acc_stderr": 0.014251810906481735, + "acc_norm": 0.634, + "acc_norm_stderr": 0.015240612726405756 + }, + "piqa": { + "acc": 0.6327529923830251, + "acc_stderr": 0.011247128539690563, + "acc_norm": 0.6175190424374319, + "acc_norm_stderr": 0.011339019654272345 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_3.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0e947d320d4d59e8f2a74f8b618632547bf39bfa --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.01477082181793465 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356953 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681822 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.2593406593406593 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29087831109340767, + "acc_stderr": 0.004532393111248679, + "acc_norm": 0.3136825333598885, + "acc_norm_stderr": 0.004630407476835188 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5146014206787688, + "acc_stderr": 0.014046492383275835 + }, + "storycloze_2016": { + "acc": 0.5783003741314805, + "acc_stderr": 0.011419774841868156 + }, + "boolq": { + "acc": 0.5495412844036697, + "acc_stderr": 0.008702022442950878 + }, + "arc_easy": { + "acc": 0.4090909090909091, + "acc_stderr": 0.010088775152615779, + "acc_norm": 0.3686868686868687, + "acc_norm_stderr": 0.009899640855681038 + }, + "arc_challenge": { + "acc": 0.18771331058020477, + "acc_stderr": 0.011411001314155136, + "acc_norm": 0.22098976109215018, + "acc_norm_stderr": 0.012124929206818258 + }, + "sciq": { + "acc": 0.694, + "acc_stderr": 0.014580006055436972, + "acc_norm": 0.652, + "acc_norm_stderr": 0.015070604603768408 + }, + "piqa": { + "acc": 0.6354733405875952, + "acc_stderr": 0.011229456510295966, + "acc_norm": 0.6262241566920566, + "acc_norm_stderr": 0.011287972563201014 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step42000_2023-02-08-13-42-29_3shots_backup.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step42000_2023-02-08-13-42-29_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0e947d320d4d59e8f2a74f8b618632547bf39bfa --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step42000_2023-02-08-13-42-29_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.321, + "acc_stderr": 0.01477082181793465 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356953 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681822 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.2593406593406593 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29087831109340767, + "acc_stderr": 0.004532393111248679, + "acc_norm": 0.3136825333598885, + "acc_norm_stderr": 0.004630407476835188 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5146014206787688, + "acc_stderr": 0.014046492383275835 + }, + "storycloze_2016": { + "acc": 0.5783003741314805, + "acc_stderr": 0.011419774841868156 + }, + "boolq": { + "acc": 0.5495412844036697, + "acc_stderr": 0.008702022442950878 + }, + "arc_easy": { + "acc": 0.4090909090909091, + "acc_stderr": 0.010088775152615779, + "acc_norm": 0.3686868686868687, + "acc_norm_stderr": 0.009899640855681038 + }, + "arc_challenge": { + "acc": 0.18771331058020477, + "acc_stderr": 0.011411001314155136, + "acc_norm": 0.22098976109215018, + "acc_norm_stderr": 0.012124929206818258 + }, + "sciq": { + "acc": 0.694, + "acc_stderr": 0.014580006055436972, + "acc_norm": 0.652, + "acc_norm_stderr": 0.015070604603768408 + }, + "piqa": { + "acc": 0.6354733405875952, + "acc_stderr": 0.011229456510295966, + "acc_norm": 0.6262241566920566, + "acc_norm_stderr": 0.011287972563201014 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_4.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_4.json new file mode 100644 index 0000000000000000000000000000000000000000..4b16f771850d620fd8400d5bc6546a719a289f18 --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402697 + }, + "anli_r3": { + "acc": 0.355, + "acc_stderr": 0.013819249004047298 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942397, + "f1": 0.29572649572649573 + }, + "copa": { + "acc": 0.57, + "acc_stderr": 0.04975698519562428 + }, + "hellaswag": { + "acc": 0.287293367855009, + "acc_stderr": 0.004515748192605717, + "acc_norm": 0.3125871340370444, + "acc_norm_stderr": 0.004626002828389158 + }, + "rte": { + "acc": 0.4657039711191336, + "acc_stderr": 0.030025579819366426 + }, + "winogrande": { + "acc": 0.5169692186266772, + "acc_stderr": 0.014044390401612976 + }, + "storycloze_2016": { + "acc": 0.5750935328701229, + "acc_stderr": 0.011431286492205843 + }, + "boolq": { + "acc": 0.5513761467889908, + "acc_stderr": 0.008698767182005272 + }, + "arc_easy": { + "acc": 0.4057239057239057, + "acc_stderr": 0.010075755540128876, + "acc_norm": 0.37626262626262624, + "acc_norm_stderr": 0.009940646221513786 + }, + "arc_challenge": { + "acc": 0.1962457337883959, + "acc_stderr": 0.011606019881416286, + "acc_norm": 0.22781569965870307, + "acc_norm_stderr": 0.012256708602326905 + }, + "sciq": { + "acc": 0.691, + "acc_stderr": 0.014619600977206486, + "acc_norm": 0.658, + "acc_norm_stderr": 0.01500870618212173 + }, + "piqa": { + "acc": 0.6305767138193689, + "acc_stderr": 0.011260988628572341, + "acc_norm": 0.6175190424374319, + "acc_norm_stderr": 0.011339019654272347 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step42000_2023-02-08-13-42-29_4shots_backup.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step42000_2023-02-08-13-42-29_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..4b16f771850d620fd8400d5bc6546a719a289f18 --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step42000_2023-02-08-13-42-29_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402697 + }, + "anli_r3": { + "acc": 0.355, + "acc_stderr": 0.013819249004047298 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942397, + "f1": 0.29572649572649573 + }, + "copa": { + "acc": 0.57, + "acc_stderr": 0.04975698519562428 + }, + "hellaswag": { + "acc": 0.287293367855009, + "acc_stderr": 0.004515748192605717, + "acc_norm": 0.3125871340370444, + "acc_norm_stderr": 0.004626002828389158 + }, + "rte": { + "acc": 0.4657039711191336, + "acc_stderr": 0.030025579819366426 + }, + "winogrande": { + "acc": 0.5169692186266772, + "acc_stderr": 0.014044390401612976 + }, + "storycloze_2016": { + "acc": 0.5750935328701229, + "acc_stderr": 0.011431286492205843 + }, + "boolq": { + "acc": 0.5513761467889908, + "acc_stderr": 0.008698767182005272 + }, + "arc_easy": { + "acc": 0.4057239057239057, + "acc_stderr": 0.010075755540128876, + "acc_norm": 0.37626262626262624, + "acc_norm_stderr": 0.009940646221513786 + }, + "arc_challenge": { + "acc": 0.1962457337883959, + "acc_stderr": 0.011606019881416286, + "acc_norm": 0.22781569965870307, + "acc_norm_stderr": 0.012256708602326905 + }, + "sciq": { + "acc": 0.691, + "acc_stderr": 0.014619600977206486, + "acc_norm": 0.658, + "acc_norm_stderr": 0.01500870618212173 + }, + "piqa": { + "acc": 0.6305767138193689, + "acc_stderr": 0.011260988628572341, + "acc_norm": 0.6175190424374319, + "acc_norm_stderr": 0.011339019654272347 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_5.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_5.json new file mode 100644 index 0000000000000000000000000000000000000000..42bb4d52fbbba83e39a37035692457012fb91ebd --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.353, + "acc_stderr": 0.01512017260548369 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.3575, + "acc_stderr": 0.013840921245257794 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.34521263958184845 + }, + "copa": { + "acc": 0.56, + "acc_stderr": 0.04988876515698589 + }, + "hellaswag": { + "acc": 0.2891854212308305, + "acc_stderr": 0.004524575892952968, + "acc_norm": 0.3157737502489544, + "acc_norm_stderr": 0.004638733202373885 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529117 + }, + "winogrande": { + "acc": 0.5019731649565904, + "acc_stderr": 0.014052376259225632 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342657 + }, + "boolq": { + "acc": 0.5370030581039755, + "acc_stderr": 0.008721074177479658 + }, + "arc_easy": { + "acc": 0.4031986531986532, + "acc_stderr": 0.010065668576794787, + "acc_norm": 0.37457912457912457, + "acc_norm_stderr": 0.00993175882041061 + }, + "arc_challenge": { + "acc": 0.189419795221843, + "acc_stderr": 0.01145070511591077, + "acc_norm": 0.22696245733788395, + "acc_norm_stderr": 0.012240491536132873 + }, + "sciq": { + "acc": 0.71, + "acc_stderr": 0.01435639599990569, + "acc_norm": 0.665, + "acc_norm_stderr": 0.014933117490932572 + }, + "piqa": { + "acc": 0.6229597388465724, + "acc_stderr": 0.011307569752543902, + "acc_norm": 0.6126224156692056, + "acc_norm_stderr": 0.011366038083435908 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step42000_2023-02-08-13-42-29_5shots_backup.json b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step42000_2023-02-08-13-42-29_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..42bb4d52fbbba83e39a37035692457012fb91ebd --- /dev/null +++ b/evaluation/rankeval_s_denoiser_44b/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step42000_2023-02-08-13-42-29_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.353, + "acc_stderr": 0.01512017260548369 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.3575, + "acc_stderr": 0.013840921245257794 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.34521263958184845 + }, + "copa": { + "acc": 0.56, + "acc_stderr": 0.04988876515698589 + }, + "hellaswag": { + "acc": 0.2891854212308305, + "acc_stderr": 0.004524575892952968, + "acc_norm": 0.3157737502489544, + "acc_norm_stderr": 0.004638733202373885 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529117 + }, + "winogrande": { + "acc": 0.5019731649565904, + "acc_stderr": 0.014052376259225632 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342657 + }, + "boolq": { + "acc": 0.5370030581039755, + "acc_stderr": 0.008721074177479658 + }, + "arc_easy": { + "acc": 0.4031986531986532, + "acc_stderr": 0.010065668576794787, + "acc_norm": 0.37457912457912457, + "acc_norm_stderr": 0.00993175882041061 + }, + "arc_challenge": { + "acc": 0.189419795221843, + "acc_stderr": 0.01145070511591077, + "acc_norm": 0.22696245733788395, + "acc_norm_stderr": 0.012240491536132873 + }, + "sciq": { + "acc": 0.71, + "acc_stderr": 0.01435639599990569, + "acc_norm": 0.665, + "acc_norm_stderr": 0.014933117490932572 + }, + "piqa": { + "acc": 0.6229597388465724, + "acc_stderr": 0.011307569752543902, + "acc_norm": 0.6126224156692056, + "acc_norm_stderr": 0.011366038083435908 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..83edbcddeb91998f439270a4ac36f32b53d1b143 --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.338,0.014965960710224473,0 +anli_r2,acc,0.333,0.01491084616422986,0 +anli_r3,acc,0.335,0.01363087184382148,0 +arc_challenge,acc,0.181740614334471,0.011269198948880236,0 +arc_challenge,acc_norm,0.22098976109215018,0.012124929206818258,0 +arc_easy,acc,0.43434343434343436,0.010170943451269425,0 +arc_easy,acc_norm,0.382996632996633,0.009974920384536472,0 +boolq,acc,0.5935779816513761,0.008590531708882188,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.1940928270042194,,1 +copa,acc,0.63,0.048523658709391,0 +hellaswag,acc,0.29725154351722766,0.004561141293448468,0 +hellaswag,acc_norm,0.3256323441545509,0.004676529200753,0 +piqa,acc,0.6300326441784548,0.011264415223415281,0 +piqa,acc_norm,0.6322089227421109,0.011250616646678792,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.736,0.013946271849440472,0 +sciq,acc_norm,0.668,0.014899597242811476,0 +storycloze_2016,acc,0.5916622127204704,0.011366477562142522,0 +winogrande,acc,0.5090765588003157,0.01405017009449771,0 diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e207711b7ae5cfed9a1acb8852d145b2e122052c --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224473 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.01491084616422986 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.01363087184382148 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.048523658709391 + }, + "hellaswag": { + "acc": 0.29725154351722766, + "acc_stderr": 0.004561141293448468, + "acc_norm": 0.3256323441545509, + "acc_norm_stderr": 0.004676529200753 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5090765588003157, + "acc_stderr": 0.01405017009449771 + }, + "storycloze_2016": { + "acc": 0.5916622127204704, + "acc_stderr": 0.011366477562142522 + }, + "boolq": { + "acc": 0.5935779816513761, + "acc_stderr": 0.008590531708882188 + }, + "arc_easy": { + "acc": 0.43434343434343436, + "acc_stderr": 0.010170943451269425, + "acc_norm": 0.382996632996633, + "acc_norm_stderr": 0.009974920384536472 + }, + "arc_challenge": { + "acc": 0.181740614334471, + "acc_stderr": 0.011269198948880236, + "acc_norm": 0.22098976109215018, + "acc_norm_stderr": 0.012124929206818258 + }, + "sciq": { + "acc": 0.736, + "acc_stderr": 0.013946271849440472, + "acc_norm": 0.668, + "acc_norm_stderr": 0.014899597242811476 + }, + "piqa": { + "acc": 0.6300326441784548, + "acc_stderr": 0.011264415223415281, + "acc_norm": 0.6322089227421109, + "acc_norm_stderr": 0.011250616646678792 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-23-08-31_0shots_backup.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-23-08-31_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..e207711b7ae5cfed9a1acb8852d145b2e122052c --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_0_lm-eval_global_step52452_2023-02-09-23-08-31_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224473 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.01491084616422986 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.01363087184382148 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.63, + "acc_stderr": 0.048523658709391 + }, + "hellaswag": { + "acc": 0.29725154351722766, + "acc_stderr": 0.004561141293448468, + "acc_norm": 0.3256323441545509, + "acc_norm_stderr": 0.004676529200753 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5090765588003157, + "acc_stderr": 0.01405017009449771 + }, + "storycloze_2016": { + "acc": 0.5916622127204704, + "acc_stderr": 0.011366477562142522 + }, + "boolq": { + "acc": 0.5935779816513761, + "acc_stderr": 0.008590531708882188 + }, + "arc_easy": { + "acc": 0.43434343434343436, + "acc_stderr": 0.010170943451269425, + "acc_norm": 0.382996632996633, + "acc_norm_stderr": 0.009974920384536472 + }, + "arc_challenge": { + "acc": 0.181740614334471, + "acc_stderr": 0.011269198948880236, + "acc_norm": 0.22098976109215018, + "acc_norm_stderr": 0.012124929206818258 + }, + "sciq": { + "acc": 0.736, + "acc_stderr": 0.013946271849440472, + "acc_norm": 0.668, + "acc_norm_stderr": 0.014899597242811476 + }, + "piqa": { + "acc": 0.6300326441784548, + "acc_stderr": 0.011264415223415281, + "acc_norm": 0.6322089227421109, + "acc_norm_stderr": 0.011250616646678792 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6bfe6f5a8dd21e4d1c6f9fd43b08ab92c8b12c9b --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.359, + "acc_stderr": 0.015177264224798594 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563102 + }, + "anli_r3": { + "acc": 0.32, + "acc_stderr": 0.01347162092976915 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.27365967365967364 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.048241815132442176 + }, + "hellaswag": { + "acc": 0.2909778928500299, + "acc_stderr": 0.004532850566893522, + "acc_norm": 0.31955785700059747, + "acc_norm_stderr": 0.004653523038369371 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.5019731649565904, + "acc_stderr": 0.014052376259225632 + }, + "storycloze_2016": { + "acc": 0.5783003741314805, + "acc_stderr": 0.011419774841868156 + }, + "boolq": { + "acc": 0.5122324159021406, + "acc_stderr": 0.008742437504570405 + }, + "arc_easy": { + "acc": 0.43097643097643096, + "acc_stderr": 0.010161552863493744, + "acc_norm": 0.3792087542087542, + "acc_norm_stderr": 0.00995589166886556 + }, + "arc_challenge": { + "acc": 0.1885665529010239, + "acc_stderr": 0.0114308976476758, + "acc_norm": 0.2158703071672355, + "acc_norm_stderr": 0.012022975360030668 + }, + "sciq": { + "acc": 0.703, + "acc_stderr": 0.0144568322948011, + "acc_norm": 0.659, + "acc_norm_stderr": 0.014998131348402706 + }, + "piqa": { + "acc": 0.6224156692056583, + "acc_stderr": 0.011310782787145781, + "acc_norm": 0.6158868335146899, + "acc_norm_stderr": 0.011348160741479136 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-23-08-31_1shots_backup.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-23-08-31_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..6bfe6f5a8dd21e4d1c6f9fd43b08ab92c8b12c9b --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_1_lm-eval_global_step52452_2023-02-09-23-08-31_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.359, + "acc_stderr": 0.015177264224798594 + }, + "anli_r2": { + "acc": 0.349, + "acc_stderr": 0.015080663991563102 + }, + "anli_r3": { + "acc": 0.32, + "acc_stderr": 0.01347162092976915 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.27365967365967364 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.048241815132442176 + }, + "hellaswag": { + "acc": 0.2909778928500299, + "acc_stderr": 0.004532850566893522, + "acc_norm": 0.31955785700059747, + "acc_norm_stderr": 0.004653523038369371 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.5019731649565904, + "acc_stderr": 0.014052376259225632 + }, + "storycloze_2016": { + "acc": 0.5783003741314805, + "acc_stderr": 0.011419774841868156 + }, + "boolq": { + "acc": 0.5122324159021406, + "acc_stderr": 0.008742437504570405 + }, + "arc_easy": { + "acc": 0.43097643097643096, + "acc_stderr": 0.010161552863493744, + "acc_norm": 0.3792087542087542, + "acc_norm_stderr": 0.00995589166886556 + }, + "arc_challenge": { + "acc": 0.1885665529010239, + "acc_stderr": 0.0114308976476758, + "acc_norm": 0.2158703071672355, + "acc_norm_stderr": 0.012022975360030668 + }, + "sciq": { + "acc": 0.703, + "acc_stderr": 0.0144568322948011, + "acc_norm": 0.659, + "acc_norm_stderr": 0.014998131348402706 + }, + "piqa": { + "acc": 0.6224156692056583, + "acc_stderr": 0.011310782787145781, + "acc_norm": 0.6158868335146899, + "acc_norm_stderr": 0.011348160741479136 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c554847933fad3322a3d014af9142b1cb73ffd4d --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.312, + "acc_stderr": 0.014658474370509001 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932889 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.30579096045197734 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29286994622585144, + "acc_stderr": 0.004541492151639241, + "acc_norm": 0.31736705835490936, + "acc_norm_stderr": 0.004645003662067885 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5082872928176796, + "acc_stderr": 0.014050555322824189 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342657 + }, + "boolq": { + "acc": 0.4709480122324159, + "acc_stderr": 0.008730280528451546 + }, + "arc_easy": { + "acc": 0.4212962962962963, + "acc_stderr": 0.010131882498193131, + "acc_norm": 0.3888888888888889, + "acc_norm_stderr": 0.010003248335313755 + }, + "arc_challenge": { + "acc": 0.181740614334471, + "acc_stderr": 0.011269198948880236, + "acc_norm": 0.22866894197952217, + "acc_norm_stderr": 0.0122728535825408 + }, + "sciq": { + "acc": 0.727, + "acc_stderr": 0.014095022868717605, + "acc_norm": 0.676, + "acc_norm_stderr": 0.01480686473373886 + }, + "piqa": { + "acc": 0.6349292709466812, + "acc_stderr": 0.011233021830554826, + "acc_norm": 0.6240478781284005, + "acc_norm_stderr": 0.011301098166895727 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-23-08-31_2shots_backup.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-23-08-31_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..c554847933fad3322a3d014af9142b1cb73ffd4d --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_2_lm-eval_global_step52452_2023-02-09-23-08-31_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.312, + "acc_stderr": 0.014658474370509001 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932889 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.30579096045197734 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29286994622585144, + "acc_stderr": 0.004541492151639241, + "acc_norm": 0.31736705835490936, + "acc_norm_stderr": 0.004645003662067885 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5082872928176796, + "acc_stderr": 0.014050555322824189 + }, + "storycloze_2016": { + "acc": 0.5793693212185996, + "acc_stderr": 0.011415827994342657 + }, + "boolq": { + "acc": 0.4709480122324159, + "acc_stderr": 0.008730280528451546 + }, + "arc_easy": { + "acc": 0.4212962962962963, + "acc_stderr": 0.010131882498193131, + "acc_norm": 0.3888888888888889, + "acc_norm_stderr": 0.010003248335313755 + }, + "arc_challenge": { + "acc": 0.181740614334471, + "acc_stderr": 0.011269198948880236, + "acc_norm": 0.22866894197952217, + "acc_norm_stderr": 0.0122728535825408 + }, + "sciq": { + "acc": 0.727, + "acc_stderr": 0.014095022868717605, + "acc_norm": 0.676, + "acc_norm_stderr": 0.01480686473373886 + }, + "piqa": { + "acc": 0.6349292709466812, + "acc_stderr": 0.011233021830554826, + "acc_norm": 0.6240478781284005, + "acc_norm_stderr": 0.011301098166895727 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json new file mode 100644 index 0000000000000000000000000000000000000000..6507e5c1dacc4734561378b98ec5cbd5eedce9fe --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087967 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3218559218559219 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29286994622585144, + "acc_stderr": 0.004541492151639243, + "acc_norm": 0.3227444732125075, + "acc_norm_stderr": 0.004665704208339039 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.4925019731649566, + "acc_stderr": 0.01405090552122858 + }, + "storycloze_2016": { + "acc": 0.5729556386958845, + "acc_stderr": 0.01143868739857839 + }, + "boolq": { + "acc": 0.4675840978593272, + "acc_stderr": 0.008726657178723137 + }, + "arc_easy": { + "acc": 0.42297979797979796, + "acc_stderr": 0.010137328382209099, + "acc_norm": 0.3808922558922559, + "acc_norm_stderr": 0.009964428212260379 + }, + "arc_challenge": { + "acc": 0.19197952218430034, + "acc_stderr": 0.011509598906598098, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.0122078399954073 + }, + "sciq": { + "acc": 0.72, + "acc_stderr": 0.014205696104091496, + "acc_norm": 0.679, + "acc_norm_stderr": 0.014770821817934645 + }, + "piqa": { + "acc": 0.6273122959738846, + "acc_stderr": 0.011281318332897734, + "acc_norm": 0.6202393906420022, + "acc_norm_stderr": 0.01132348350471584 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-23-08-31_3shots_backup.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-23-08-31_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..6507e5c1dacc4734561378b98ec5cbd5eedce9fe --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_3_lm-eval_global_step52452_2023-02-09-23-08-31_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087967 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3218559218559219 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.29286994622585144, + "acc_stderr": 0.004541492151639243, + "acc_norm": 0.3227444732125075, + "acc_norm_stderr": 0.004665704208339039 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.4925019731649566, + "acc_stderr": 0.01405090552122858 + }, + "storycloze_2016": { + "acc": 0.5729556386958845, + "acc_stderr": 0.01143868739857839 + }, + "boolq": { + "acc": 0.4675840978593272, + "acc_stderr": 0.008726657178723137 + }, + "arc_easy": { + "acc": 0.42297979797979796, + "acc_stderr": 0.010137328382209099, + "acc_norm": 0.3808922558922559, + "acc_norm_stderr": 0.009964428212260379 + }, + "arc_challenge": { + "acc": 0.19197952218430034, + "acc_stderr": 0.011509598906598098, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.0122078399954073 + }, + "sciq": { + "acc": 0.72, + "acc_stderr": 0.014205696104091496, + "acc_norm": 0.679, + "acc_norm_stderr": 0.014770821817934645 + }, + "piqa": { + "acc": 0.6273122959738846, + "acc_stderr": 0.011281318332897734, + "acc_norm": 0.6202393906420022, + "acc_norm_stderr": 0.01132348350471584 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json new file mode 100644 index 0000000000000000000000000000000000000000..cc97b2635f05f68bf297aa6be8eedfad2f5173c6 --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224482 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.015050266127564446 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681817 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644645, + "f1": 0.3362023995826813 + }, + "copa": { + "acc": 0.61, + "acc_stderr": 0.04902071300001975 + }, + "hellaswag": { + "acc": 0.2954590718980283, + "acc_stderr": 0.004553164013379555, + "acc_norm": 0.32443736307508464, + "acc_norm_stderr": 0.004672074496749016 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.4846093133385951, + "acc_stderr": 0.014045826789783656 + }, + "storycloze_2016": { + "acc": 0.5734901122394441, + "acc_stderr": 0.011436857656268697 + }, + "boolq": { + "acc": 0.44587155963302755, + "acc_stderr": 0.008693659886486845 + }, + "arc_easy": { + "acc": 0.42634680134680136, + "acc_stderr": 0.010147858603835144, + "acc_norm": 0.39057239057239057, + "acc_norm_stderr": 0.010011059112064239 + }, + "arc_challenge": { + "acc": 0.19539249146757678, + "acc_stderr": 0.011586907189952911, + "acc_norm": 0.23037542662116042, + "acc_norm_stderr": 0.012304928418747611 + }, + "sciq": { + "acc": 0.718, + "acc_stderr": 0.014236526215291334, + "acc_norm": 0.687, + "acc_norm_stderr": 0.014671272822977883 + }, + "piqa": { + "acc": 0.6289445048966268, + "acc_stderr": 0.011271222398600525, + "acc_norm": 0.6218715995647442, + "acc_norm_stderr": 0.011313980666854535 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-23-08-31_4shots_backup.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-23-08-31_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..cc97b2635f05f68bf297aa6be8eedfad2f5173c6 --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_4_lm-eval_global_step52452_2023-02-09-23-08-31_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224482 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.015050266127564446 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681817 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644645, + "f1": 0.3362023995826813 + }, + "copa": { + "acc": 0.61, + "acc_stderr": 0.04902071300001975 + }, + "hellaswag": { + "acc": 0.2954590718980283, + "acc_stderr": 0.004553164013379555, + "acc_norm": 0.32443736307508464, + "acc_norm_stderr": 0.004672074496749016 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.4846093133385951, + "acc_stderr": 0.014045826789783656 + }, + "storycloze_2016": { + "acc": 0.5734901122394441, + "acc_stderr": 0.011436857656268697 + }, + "boolq": { + "acc": 0.44587155963302755, + "acc_stderr": 0.008693659886486845 + }, + "arc_easy": { + "acc": 0.42634680134680136, + "acc_stderr": 0.010147858603835144, + "acc_norm": 0.39057239057239057, + "acc_norm_stderr": 0.010011059112064239 + }, + "arc_challenge": { + "acc": 0.19539249146757678, + "acc_stderr": 0.011586907189952911, + "acc_norm": 0.23037542662116042, + "acc_norm_stderr": 0.012304928418747611 + }, + "sciq": { + "acc": 0.718, + "acc_stderr": 0.014236526215291334, + "acc_norm": 0.687, + "acc_norm_stderr": 0.014671272822977883 + }, + "piqa": { + "acc": 0.6289445048966268, + "acc_stderr": 0.011271222398600525, + "acc_norm": 0.6218715995647442, + "acc_norm_stderr": 0.011313980666854535 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json new file mode 100644 index 0000000000000000000000000000000000000000..bddff52eee525375b12d0c95246242da0c611395 --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.37, + "acc_stderr": 0.015275252316519362 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402706 + }, + "anli_r3": { + "acc": 0.345, + "acc_stderr": 0.013728421539454878 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3464373464373464 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.048241815132442176 + }, + "hellaswag": { + "acc": 0.2952599083847839, + "acc_stderr": 0.004552272447071696, + "acc_norm": 0.32374029077872934, + "acc_norm_stderr": 0.004669459891917693 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529012 + }, + "storycloze_2016": { + "acc": 0.5740245857830037, + "acc_stderr": 0.0114350142621812 + }, + "boolq": { + "acc": 0.44250764525993885, + "acc_stderr": 0.00868705131518137 + }, + "arc_easy": { + "acc": 0.4292929292929293, + "acc_stderr": 0.010156678075911097, + "acc_norm": 0.39604377104377103, + "acc_norm_stderr": 0.01003558096209795 + }, + "arc_challenge": { + "acc": 0.19112627986348124, + "acc_stderr": 0.011490055292778585, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.012207839995407305 + }, + "sciq": { + "acc": 0.717, + "acc_stderr": 0.014251810906481735, + "acc_norm": 0.68, + "acc_norm_stderr": 0.014758652303574885 + }, + "piqa": { + "acc": 0.6305767138193689, + "acc_stderr": 0.011260988628572343, + "acc_norm": 0.6147986942328618, + "acc_norm_stderr": 0.011354179751257073 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-23-08-31_5shots_backup.json b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-23-08-31_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..bddff52eee525375b12d0c95246242da0c611395 --- /dev/null +++ b/evaluation/rankeval_x_denoiser/checkpoints_2b855b55bc4ul2ndfixnew_5_lm-eval_global_step52452_2023-02-09-23-08-31_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.37, + "acc_stderr": 0.015275252316519362 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402706 + }, + "anli_r3": { + "acc": 0.345, + "acc_stderr": 0.013728421539454878 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3464373464373464 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.048241815132442176 + }, + "hellaswag": { + "acc": 0.2952599083847839, + "acc_stderr": 0.004552272447071696, + "acc_norm": 0.32374029077872934, + "acc_norm_stderr": 0.004669459891917693 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976633 + }, + "winogrande": { + "acc": 0.5011838989739542, + "acc_stderr": 0.014052446290529012 + }, + "storycloze_2016": { + "acc": 0.5740245857830037, + "acc_stderr": 0.0114350142621812 + }, + "boolq": { + "acc": 0.44250764525993885, + "acc_stderr": 0.00868705131518137 + }, + "arc_easy": { + "acc": 0.4292929292929293, + "acc_stderr": 0.010156678075911097, + "acc_norm": 0.39604377104377103, + "acc_norm_stderr": 0.01003558096209795 + }, + "arc_challenge": { + "acc": 0.19112627986348124, + "acc_stderr": 0.011490055292778585, + "acc_norm": 0.22525597269624573, + "acc_norm_stderr": 0.012207839995407305 + }, + "sciq": { + "acc": 0.717, + "acc_stderr": 0.014251810906481735, + "acc_norm": 0.68, + "acc_norm_stderr": 0.014758652303574885 + }, + "piqa": { + "acc": 0.6305767138193689, + "acc_stderr": 0.011260988628572343, + "acc_norm": 0.6147986942328618, + "acc_norm_stderr": 0.011354179751257073 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ae8f649af1a4c76b0b8468bf2033b652dc5cf3b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ebdfc43423972a8601dc16d3596e4cb0897065713f4ac606681f2cdf8cb019b +size 132046359 diff --git a/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3becb9236899d9f5b69c34bcb713bd7c1740f12d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0784ac4153ef77e45afa5535f15493c21783ef4097c76af01e7147f924b64f00 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b74ba4e1e0a316a715fc986393c173dba050f8e --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8eed83613e3385df186cf830929463aa12d83e87feb3d4623d59578a54ca278 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f75cd439d80576f7eef19e976ff14377487a2b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8b69250a5892a05cde97177d9326ace782fa4fbf2c092b6c7396b88fd41b9b +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eee2ab24b1455c59ace348e8fd06400d71866e9 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9bee9ecda27d21a06aa2427b8c54ad8193af50e0b93e99c7c7ee06075cd0301 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68cc59e03995c5cd04c6760ab66e3cadeffd74c4 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909fda18ca8578749081b357313b036ed20cf16c7eb084463e5d4a8f8833268f +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b3fd6ff9fa1a4bcfdd07dec05ac69c7a446a088 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d5126e9d4c75f64ee554c60efa47cb49be79779bedc4aaef204578d2de3d5f +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67a11e2680bb20d11a3879239bc384fce6d0f8d2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca15da1918d159d6eb5fdedddece005c59f7a30f50b6573acff478a41178eee +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f32d98b03c0bc010018b9b22f6a3c64da828848 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf77a21df1d01d931cb67c2c93131aa677734ee68e12b1b420fdcfc06792e8c +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b83e610af19ca028a9ad11e74e678dd3083593e2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6c0c8b563b7dfc0cfb8dea7b35d84c5211a51b6b41b80cc04e619bf2d0d72a8 +size 132046573 diff --git a/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ae8d8d1f752f4b05feb3df533931e296756d97 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1da01fc66baac2e9eaf96ec65a577747492dd9e729fe23cb0004baf1cc4630c7 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1eb2d91b52308f0d342d4bded0bad48f1fe9d00 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe96ba5a5bf1c3ef8dc404c640d755e2497e51a3ac2f291fbfbcfbbb62bb0f5 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75d6b39b132b734cf8ab9de5b3b13950c41b72ec --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:111a04b8aef9d6e532cb9e8c97acad27a8afd18f7c6737766973eb0ae29a125b +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c0632ea378177891d5b9527f3f5f3331a90e5d5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d899785c1e0f9cc34e944f7f9ec46c0f638eba2b9a461ec2c377025bb9eb7d +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c7753212fd6edbeb4b22159cbfba28bc330711e --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b841a9459d9aeb6f92e441d73d2d8bea8d9f134537764ab623e49a700e1ec92 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a626f372e689c3c4ab86c02a1703d755d3a7ae1 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c9e3e7bf7deaff5c9bef33637ddabb2082a5e0af3ec5cdcf6c7b186b5151a3e +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cfbe4810ec1f0e83f8097911589aa5379525e3c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a2f2ff0034ef6cbfca87b1314ca2e848c3211d2de69edd4b3790196a1e3ae9 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53f5811348556d60f9ef79fa0efc648e07ea51c2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5363764a7c98688309a8bd3f4b4acbaee44344532e2576c3a61f9a2cdf065a44 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a4be8a815d289708b2b21d69933fd93a0ea1287 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e87b0160c119d26d1c91ecdbf0b46525768f7b5b305e3e86258988fe7b7d2c +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fdff736c3d53ac2d84725293f861dea42e8bc87 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5d5586381d84bf031ce9eed3d9771fa6b524797bddbdfdc1f90009843c0979b +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57c46f5c6ea508faa704bb86a53dbf1cb5aeecd2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e87baab055fad043b022d2881937fe84e9504a93fe96c68ae0c9d910beff72b8 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6370036f3f8002245c122f7f2292aeb730ba6e89 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5b436b2dd975ad41d9190cae7f441d0318b3f4a1cf258211bf90210be312050 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..338c67afbd6c5cf2de207dcee93251d590afa0a5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1089c5ade5e13a266cbc20b7709cf21de6b5912da3927ddc136f749c5870c0b +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a87af35c2e20caa3fdc4f82381ffada93524828a --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:902cec4ef951e56c169461adac0d4cd5b337f3f1ea06a23aaf59752408c88533 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed978bf5ee53be90ae1702a00208da74341d1e94 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be2413509c0e323dacf12cdcb98581527a773a0a7e95ecf7cf7d60b31d9808cc +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e0f8b2aebb7f6eba0170560d3a74ca6533bc1c5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36e816d0187e7937d8c9983b0047a8d1b9fabe73d655d35dd8f1727ba96ec76 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..746a965752bfdd442504fd7d271b382e4bd01586 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9077a42b1d608e2166c3a20999dc5220044e41647ec00ba9ee36d50f518b7a30 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49eb4bc70195e2193bebe17b79bfdd53af5765e5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceff865f73dda8d1f09cb1c2e3f52da2ad2d94b02bcd289df8763aa5742f3391 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4256a244f9268922db5f42f1161132bb252ec3a5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3a686d3b010f3c44d968fe83d1c91b91e8e1a770838ef1e7883e41878283d90 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..347723cb9aa44e98369cc5cebd901f9e41ba0b0f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b8444190ecf254debe8f26b149b5626e31292b288fade99d7dd3a1c13b7bf55 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b17c6a93001bfed9f5fa35a63b045f111f67cf2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3b132fd5db284a496a34e16847864c27e5ab458ef58d4a0eda832fdb487e3eb +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..357c5e23cd17916c33e12d44176f56a8eb8e97b9 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e42571df92853bbac7d8fd57acdcfface2963ee62d029a355e4acad9d649d8 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69d9b325353e34187e613b0a689318a3a6bced9a --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1554f98f2155e218c55ab296680f02618a9d646dfeb1128e0733499e4c1ebc3 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6ee5a4d4950eaa154e25a92f7d3633757117159 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eac72a41a473b01d5e5efdda836d2412d925a6173021cc85be99095747d347a9 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc480a7df3999b2559e3457ede9e563f1a0ee29 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0a87a358efd2ec715e0e422c26b9f0fb6fc7ce4f7e112a3aedcbfce88b06c7 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7340ba6cdde2c7239a4a281cbb23a908de571f94 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e129e598988f7caf924847dab2b9845f22e8064a513278f924c1b81d5d75a6 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d44eb3d93cbc8c4fd4a2e5f0b8e3d2c56eda03 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5541d29ce9bee8a0a62bd6a17de811bc4d6e768ea215e9a6056acd412b4e73a4 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d0ff75dcc2a96cbac23f4afa0fdb8c44180bf29 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6fcba96950094db20922fc5554495378b141224e531fd13db3d879bd9ca4b4f +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0514c0148e2bfcd2870e5287dda12d775d089fd6 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82d3dcf92b47c8208c478f48e5774bef850e8b2608fdaff1b0a735f66f560484 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c078a94a525909596f5093d8268dc800912abd --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf665b7b11934f38ef436fb9a483e2301dac40acaeebef7277f3f7c473473cfa +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc91cb1f1ce7a8a1924bf21cfaf276eecb407fc8 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b3352ee00269aaf47a928e4ab75366d3311a0b028dcea65b9e2b54ffbe435ba +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcfba7785c683d12771be4d6f2e698fc9c00811c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76483f8be1db8b65c30add6eef1c548a40e55a7f7c63dc8ef35d760e756b6b0c +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b5601da046d0ccae02afea54f64cb57ee2ff0a1 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205f7c40627b8642634a5b3ac05ccb924128caefe32980b0052f3439f9a81fa7 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..583e1581f6caa175ddb9b2ea879b7c3d6330f304 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d739894449a46a3566a29261eb63c2bb539648071e6fd2954a793a49d18f4411 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79025e502d7bf72f78d5eaee02ef1c6112071db --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f542082294a2e340d1629f4061b1e45670e5d10f93c81a48becc8690c8520a +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9d607e663e309ed6e5a09cf1a92f1e1f6b7cf6 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177a54b1ccf447deb21eb45c156c5d47669226a967e000c2eb9f70252770df01 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13efd5803c965badd3ed872a1056267f7e77ee65 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:084d747c5cd19781e059c70b23b9b2c2c500ca394266976c27ae161d27c2bb1a +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7af35c26a2ed8e68168b45d2ab018a4efe2f1bfa --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6930ca017dae9b9e3fab5d4fb0c51deab1d6329af3ed6fee2e1d3484136537 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a8b90d9baad64c4649e87b21e577e31fe3e9813 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7a613deb9b045f9efb9ec105ce4fda328ed9202826029643c6b9f94e4a0b50 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caceaa21ede37a02481b65aa41c724295e070d7c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3898db0c9ab50bf41891931187cca3f02a791528fffc9fabc792fd1c4ef80728 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2500bd3d2cf0c9c74a13404917fd9ac23fac4936 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5cbecb5218fc3e5ae441538847a419e02b82bb23080c59e1f8b12531dbe6b1e +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d83e82114e314f17a63034da086eccfcdd0e3f2c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e00b853ecc7d5e8db85ca33b6b1c0e2dc3fd3e3d2063e6a894a40f348f0da066 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dc879d5039961138d8b2b260d2ee79bcf244752 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b792ca71252dd96943c9ad95cdae20a27ef51c730468631b1654e446f4207fbe +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc17a2ca63a2bff0511504b0e93fd8425e56bec6 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b296852e710368ca773f968416a23c6e4c690440a02b9049a152358b13855d5 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8505a34004023882c035c76fb9cd802e887f9be --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f1cbb61a5eaae2f4a738368ac6a420fbdd8ffe51448dae5a3b2d8259db8a7e4 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5a77ba00626662c9857aa61ea89358c0ae2acce --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d30bc445ed221ade41b863724031e23ed5de238b5449a9d8b3df91a9c27ecb8b +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05bbe26c0d2dae502574c1c9a012e0ad92f81535 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52a3bcb26a2efeefba982e6081508e2ba12a8becde41a0a7cced44cf18b0db33 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e489c33fbb01b2e571d72292e9e61b03f77abd3 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f87840d29c470544e7624e372b0b0f69d4f4a975544119bf48eaaa19dd3877 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1910dbbab891a445c244e46a610fd511878c685 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a4160958428c188cde72746c8faae589ca34195d782ca927e5752ac350cb85 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81c7ccb2c036d86c537877cfbc2272fc8ed6199c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbed5188abc7883e908e33e5779d4e4dededffa73798380f795f55b356ef155b +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..955a52bdf4cb695b819fbd75401c90be4c746fdf --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0f8b8474421aaa4582dcf5f4f58bf0e5c9a22af4aafe1aa506e13861d8fa67 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4e625f0442bbd453ea1b191374852d908169b9c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee2d1992776e063a3a97c6a8aa77835d03683823549904a1970ae924673dddb +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..937ba474a945a250932db1bdb3b3ccfe2fd3ad23 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f71153d6ec05ca04fb384420b06810d0cec55feb8e0f347e3f66abfd9cc598 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e210219cff884bc14a5fe4ae06fa7ee1a1c40d2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41b5272bdeb5b9783443d91a3f7952ad53f901267ed7f6b4d76416bcc8bbdce8 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81768c327c9e4d2a38376ea4dc8346b3ed8e9428 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e2bc42d05a93eb60c917b3bd0729ed47c8bb2c75fef87792892757d8738780 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d5b03c5821e761833b0a558dbd33bbdb14e62cf --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f1aa20e2501787f6c891ae95ee80bd8a523a59901830f6f267984626b4d2554 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0826be1ec4edc9e8b7fae9e4626ea614536e02e1 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c365f364fcdf5939c0a0c00f5b1b229d8537fd2c0ca0754c58e4883cc990f7 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7a8ebc7bcfec6ab96451add7c82baaf49f52072 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f750b21493b3cd453f058707ab5c78bf99af7e40a8eefea8741a199c53445c4c +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..695b7eb5458097be41a604788570c9a654119343 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c848bffe39fd24a7870bfc5bff1b15a6d233deb5383bfab886f85574126cd58b +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4310a5712c81e2aa4c86085750ec3069cd091d7 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8d458c8de3a4b28c399a4a6cdf51e4ddace6b042fa439ab753ac709d531ea4 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25fa25ddbe197ab55026bd3db4fcebc2247228b2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4849bfd0eb98ea9752042d18199c27508fc09f12bdf5206af5ca5dbc17d917a9 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69819a58b91131361bb268104169b0b1683abeb9 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618ee28bc03da23721020f8e8fede5c574d523524488f9c55cb70f72336b852c +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce391dc1136f82a740b3e01f6ab733f1723149b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2a52fb48239fac71a17ef76d867a50de94e39fa8fa2996eb8ae547abe8636bd +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..892cc9181a1c33ccd784b31bb5b895b67656e956 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6299c79dcc06f49d8874e8602184a629b11e56edf1ebd0f6323e22bee6be454e +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ebdf6cff4d8e24d7872bb36263a1821ea5f797 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d39f32c7db52288e67641a52ab41cc366581a5d840b6ef98a4d5ef7153b1cb88 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db33dff2e5f55af91252ccdb5e912719b6b33f60 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8d4da3b7d1e607c3ccf56707ad82b63aca9255e36ce1c45106e9cc993442de2 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b28e59a035a89d08dbd3f21a3768adfa3323fd23 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22743e158b22ddb62df5cb260368a29b48a915085f726a3af75fa16c00972a9f +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..852ee218b72646f8b5a017529e3c4bb4a9768c53 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:041a429c37af2bced64ebaea2a2bd57d7d20b62f6b744e9b106066f26c907c41 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..515d0989fc216e2be5372e444fd089b2f2a2028f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f73bc498f8e05528f538d7697fb0d492c1ed47bb44383d873c73120c11e732c0 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9bac60efeb20f8608840b5b78bd728396f47e4b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf88189354dfc9898256d4f8e704f89ccd2d0ab282a7188cc1a90939f514e864 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae340aba96939f27ad3907c95a5ba028f8a3761b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078f51868399cd3bf9f1992cd7c4f37fb8d9a73db0b6ae1175ef50176f2fe13d +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e3e15a45960f27bd4127eaca443582e6f5d4abd --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b42b79d95ce6cf9daf2742a917909387377fda6d61ac42c5a212e7770f5798d +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b49e860bc41ddb08c4f94d49999e954ce3f9390d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb64adae96779ec3e8f500e230ae911cf0b6c794b58b7734464f729550646df +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc109026d16cc0a3f659ec9f832ed8f5043f966d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b97898fdcfb2f8027ba055023c3de216e775c339c2bd7436abcf52c1a107b1e3 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8fcce04cd162c969b441d3c9741e875c1d2bbf3 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d408acdb8498219665b63d6d8fbb7a89ce0307c185e5dce93c12ea6025094b +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a624204139c6bd70444c46d9331a5a6917aada7 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef0dbf06e7583c31826d63c2d88544f5e69e529b711a79620762a61f7bf76bbc +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a41e908d8863dad18e9856c151fc38b10b7ea6ac --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d53024857cf66aff5fbe32cd0be7a6ae2583af5b93514f3b59dc27a72d21d95 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b6de5a7d2d7977a3cd25d613f5b38b54b57e9d4 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad9ecce336d1a54b63198de5434129265930bfa129736e3b8a42a77a4d2d516 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df8a6440bfde3c8209cbecad8a4500e600ead4f2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6087a2e8b84b010116ae489dee71101576a724a8493068482e26f67306861a +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb30748a0f8d476dd8c7e6f9000115dd62928bc --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8fa2c9754bc605e70a1e3f3eebcd793a5af415d7ddb3aab5d1c8b3e8bcaefd8 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f2513c96b4f1b967de6d9e80c8a75c8e09eaafb --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e112757badf32409317eb7518c305996355557a117e40d2b37eeb952d4fc93 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12dbad6ad873bc75f6faed12f24faca64af5c393 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0490d6b6d4360974351c50ac914fd04d0fba4a83a66869d673563ba2d2cf7125 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7ce2f64d699028de9777262c0bcc3c1103bde3b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ca983a9b38b033ce43b4adda3f946a6ec20a2b2150917ccd6c78deb47166f19 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a65ac5a1455548c798d6c98abefedcedd77adf4c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56967873975538dc513dcf8c880f57da5cd6363bebd0af6050d58fd3e9d3e7e0 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ac10bb32cfe58e2506f5ccb15cd1480473d2e72 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d4ea242563991d0a9da6ae234b1ddddb1bb451c7ffd133448722b5e697ce906 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db365432f589516f8b6fe908d81b4fb2d1415e9e --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9473b4693debec95448c81549ecc24a7cfca563db9cb8f6a6a14c9d434457ad3 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4473ae2cd88f3e71f6125cc7d23fcbfbbc0e6ed4 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e53e8d4bfc5765f67cb2c41e3093c04ffd33255d31d65f8aef06104672280751 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cd4bfd1cdb5233ce6e7c61d05867dace2b2e5c4 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984aca79e96d7020c1597afc9229a1422e5e24787ff85ed1be580a4964db770e +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..315629868dda934a8f0bc2cd9118275647026768 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe6fdaf7cb1a1ece4da3000f7df54ec1dd5144a6d600f7aa31ac379fe288fbc +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9528b91e733e94485ac42aa4a92db2c2435c442 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b832d20c59d185ba9a46b6c4dddcb1c72a7bdfef2078ef4957425906b51bcf94 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8877b98697cb4ff001a4c0b80f3de6393473042a --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f22ff0c7d45855ba897073ace26d79a668411a05451b167d84a6e7202389eb +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7104c5d8ad5431ad8efc2d2cce9744c8a505752 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfff793ea9b2d143e7f112a533e4ea47989bb3fe7e67b0499dc7960b4acaeef +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eaf3cc54654c01b96ed4c3a12249b22177264f2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9644e6aae6455e6bc9e4d30ae799047cc71846a72e34a2558d2df104ac058b7 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6411d03237e15ff9b800e672fcb455c3f4f747d7 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0978da441c4bf21f106db97990cec9d8f0c993f9ded2a2c15b97f95c746ad9 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa0f5bff43db6414787a65d22982e994c57a0bac --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ba240317233dbe541a0b438300f842d11271c1976af40081ce3e80a1042c71 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0193f2410dd1204691b41ac4211e4e23a3e80b1 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d38c3fe2d645c5979dc27cac21fd50ae48729303eba5abd3e7d7e003435f75 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3270209a258dfcce75be0e5762dd4a79cd0e17b9 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d646c7c45eafa095f6b951270c98c7ae5215a92fa9512876fc4dc8311bd697a0 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5daff575e36abac7e3ac8b529b4d23ffc1c667d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23d917d567be76a8e277ce983d2b0ead6f068b2ebeaeaf99de62ab9cbd1c6b00 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eae533d43393a5744292d94e94d78e536c79eba --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b102cf4f567fba872e49ee288b280f99670774fb1fe0ecbcf1e41d98e6525f2 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83ac0f3e113845dcace418bb62dec437e955f11 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67a01681d8ffb947bdd648da31cf05ab04d00f68fc1fc9927eb4e03731f57314 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7053ab47af74e634bacc627f927010d643ac9776 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801b06d0a91f303502b641786314540298f7468f3f4de5d510b5bf8d2ec0ba2e +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8b9f3c87188e34c217799717f09730d3f072cf8 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1595d711e4ae66f55b5d5bca09f40974a5018490644ec7538691a64e0eec34f5 +size 132046359 diff --git a/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd31f1f1a4acd6ce39ed098cad6414101753fbb1 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82bc5cae06d2abd384841414efb1a6b285bac72a9c969b9d66dd10873b9d306c +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c42c19c686ef5df41ff86bf6a136052392ced714 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e480170dbefcb229001e45dc3738299d6cd8436c47777a4c29cbdfc76863f2b +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90ed7f8406b2122cbab3dd3df719608bdc940816 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2dd820a38914e2c151568969bf3ef221cd2473ecaad12d59a6f2b34eda77250 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3858f4526bfca5c734e412db3d796c99403278b6 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d67399a87a4941ebe9738b8045159c020218c506da5cada879177220c480cd +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c6da59e5a9a4050880508783717057ee9fda4fa --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2291598ae794fe9a453a4a89b60356f08657e5c1ed9807528fd618912a5cc68a +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82707e851e5827183abcb4ae0a4de665b82667e0 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced9b0cdd096cf3b1e31ab0bae6a8bf08d1c3b817cce1b62b3d124bea252274f +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d94457636dd758a9e969e9197beac9102ba6580b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d17ca511ef7c89bc80d2cf5d889b07c378878dbce3b9738b4f0dff5d82532be +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76511d871d64e4c4c04f0b8fd2e2154622572817 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1825e88206176d344508c11383829da2891370aced2b838378d37201777b812 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de4c53c87fa42751fb89ab0e7da255436d01e25 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af25df853d213008a5d4b78f358c18364a207e4198de057ff5d02e44aeaf603e +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0989f55e2fbd5be4750cde1a903ec066315bd13c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43c3c56b1fa438469dff1cb96686ade279530509eb632cf434000cea586ec23a +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d2d5872c58f8193170d6fd5c9a1ebc0724544db --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b84b6ccc58ff6636277e5f730d43bbee79c644300023ac62567932622af0675 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb8ffd31e87139d4ca28d0a113734dea475e7fe --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef1f7393175191fe6fa688a2a0734e4dc0e74b491236094804a838d2ffa23b51 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffe21721c8d6ce9124fb0ce9c961d87a271c6faf --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a40a1a4d5d27dd2c3dd900bfd8d2738acd096bcf3b8de2c411ab5d59ce8ffd +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a40f3a6de416200cb36eb790b72dda459a69cf6 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d098b41f74b69bccb5ed317232590f7856be86684158e7343d0a532f3d7b15b3 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..276cb138ea889351ce17d234ea6c2395a6e18bbd --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a44dc67597a7f121b5e9433305790f2210f86ae5ff67d79910921b3e47d9b4 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0b7cf34d416e4aad026c81ec21cc18517e49d13 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9438203e8835b6a32ce7bdae92fe426dd44501529955c04d23537358ea9b02e +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb1a28e5f2731858e1255e9135dbe25fe3b4248c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a17540554b9fb09e0ea975ed21118aa9835b0c74afdd892cd31ed52a6e31f8f5 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b7c8ad311809786e94bb6b6df1fcb016a86e196 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99670651e67e1405bd386b3b2d4a009984bc5b114b3442c3efc9badee5d04f99 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f627795117c0f089b6e5440a8d9cb2395cb7482f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a3e373c6a2b712183180daccf920b299e71103694f57163e36aae20076ff9b +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..803678e692c1f641b2c8c3e7c8d812b1ce91767c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae8ba80642fafcd05dff76baf75b0ce9f4121b65cb9c8d0fd6271ae49871d11 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62aebf4eb5e2576ab560722d5b70b1a9e7d4644d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0af7c494e084f41aa721810805596cab2b672de5922b6eb386cce969155bcca +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be52417e082e0c3588a8d077a2e27938164efeba --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a7df9f94e77a29cb3bdbdc4024a034deb90db88c0f90cf7cfbb703cf1393e78 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b87d34fc6b144ec5876e6183fdc995d1b73844d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161ee0a55b12f528a66b15f0d270773f6c202ca849196b4b29ec40707f47adf5 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d85d4b1a8ccb76ab76fe9eb7ae731c0656bc963 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d547deb1d8a3309fbae5b6edce7744ca974a1afda31d84627afcd0641e2bda4 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9d709da94764edf0e3896633a1ccf59940e7a5d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b43b6aaa720ba796b0760e39e2c9d42476f161f057a21df001a028613f3fe25 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..992d60dca65e5a8a50c51fef5c054f18b262779e --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5abdcec65599bfa213399feb60f33737294d8fa42bb8bb0138c6218aebb2c6c7 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e082bdeaf34e8e971e75f745ee9bd2114addc008 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f71280f1398cc62de95d52e8f376d98ee10b1efe83c4ef55de5eca1ae66b24e0 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c026f21b113db4d4c54c3930a897c7fdf5275cb --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d3a265ea1c692ebdd37a2584e23cd452eb6f3cf3fb84466af285efd4786d81 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c7a5c1d64837a5e5458fdf98da550fd628a2a8 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1919d47c449041e2a7877790eacc3592728441f5ef3186cb703df7e80223ca0d +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4148bf427ed707b60913820893a09b32b536153 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a87f2a7b737770b1b31cd1a474bf7224b620e3c7554bbc07869b1e1ef5fc2eb6 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf52befcb73161c31bc8f349b5ef2b4cf4aeda2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4894dd80ed5399414950345cd476bf3bca0420453ccdcf69053d2bc6722c5c +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..659183d806fe357bc8a5e9c430c7f93079cc7368 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086097049fce81755f80732259c54ac5ba1519bb24f29b168f31532c146a720c +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58f511f18ba4cdc4c4de7cea4361ab230627f867 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7e21fee9259242a1ea2a77543dd824875238f32d51b3738ab56c3f3a4b0533 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b100760086b9dd7359a340ed01f7c80ba068fc03 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b577ce7c5b7a72df1065eb246163ab276094d5f0610702dcd2ea97ad5bb64e09 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09fa89763914f5f8ff96a7ec5d6c016f70a50ef2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ee198d4edd4d2426d781e7834ecd5626dfaee909cf21797e34e5b579d7f672 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6725a14c38e7962120986ff4a96a73a5b8a993b5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad3df88e3e9ccbfa17b28d3813a326f36f0fc5057d440210136f48ce52e2fe3 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64de1561073a42e0ca57743065c015e97caf6c0f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21326df042e76d49c3c6e9ee6c347cee63cf79cee807b5a1ed8804667c4942a9 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dc435c3985bf593e6f952041f2c2f99abde2962 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3c8fdb1efbeec95e5b72527ce0686d99f6da77260a58b88d67b22f93f5ab3a +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e5e189b57e3cb7b75122443cc3937e25796e3fa --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5069dcf53380f2896b15634558099e3dfea3d0bc477f3c2a79c23c257ebb46b8 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9b5b01b2f310593d149ab9afb6179e90e68c9ac --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d386d20ca032feaa52cbe9dce28da2ec3cc0c2c06016ebb83da757985a92b900 +size 132046573 diff --git a/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaf3fea482a86d91b22bbd61f3ac067e1fc53398 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7b8bfb25cb52d8f1cd5b5940032bd14f851cb7f3e7cb30e3d5f5b2d96c36742 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65f7a838ca049d27ac7485d0e892ed6912c99439 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b258abb993563283251046b096c0e1f5e7771a571eda25a89426822b7ef850b +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3add508ac2d6b192d802bbd7401de5ce08834c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1baa3e66c175385dbab9ba4338ab66fd8f98e57e0bc5ff50141716acb891ee8 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38e42946717edfca9e73a69b9ebf7e05d1441cef --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114102c63b0909f0d8948ef03c1248410038005e9584c2f6c20fb22966e0c130 +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aba102257cc0564ef162664d20c1599295f4c71 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f223fc75582aa2881e06f0acce6535f2a2026d45900472e97586eb0dcc9530a2 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe61b8432f0e714241a5e06578ef70923cccee40 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98fa93b10ae86ba6c1211ad376049b99a6c0fe1a2f079aa6cc5db038ca13199 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f965b912e531a9eb7d541ad78ae1000bfe2d0a5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c7d81bddd189259b4fc24dbe142f2d8a25f262e4f64034658be49415cccd9f +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e9ca63a36f8fd3612ac3348a28d423a5495359 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef47126fe8f48387580018e34d44168b1701d00b411d4c7b73302f0ee094038e +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..294eb898747d150f27b5d60798cd556da6442961 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a22929e3a5999ad522704353ddcb8af2dd2cbe47fe8b02d836b0893326c4b84 +size 132046445 diff --git a/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1348e398e3e40d3a62bb11c4fbe0bbedd8be9ca2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b395a33b642cdce3b96312917a4cb116e31fd02d27d09afc400c936797de1df +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0585694bf63a2b22025e3b51c68d405a2d95b3dd --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c01df8d54c62e2c3bb9b6eaa5dfc469a2b4c753a0b2eada64cfebe913ae1f48 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..802bcc27aa4dd502c04f1867c2839bdc0d59ad32 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29891cdf28222c0237bd8c832a6f33df74cd8034f8a1834df45ff451616c8b1 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c67e9f10ab77791ae20bc412e7c04b3be066b3be --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:243bedf8fb82349b6d9a2e2b817b0276259ddce61e009c5cc270eddf8711a9c2 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fbe00e762374d0f20cde3a6db7ae2190238727d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3589a4d7cfc9157ad37d6ce2ffed4e8b2591a6207e19396d67330a37c4e65e00 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b364a9ff4cadfbd0dad15395631b1857a476ab93 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f033e4305231b7037f5409a9b4c91b504bd1c4791679bb51238027d345ba985f +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf93b1e3bc9b2dd02d5d7e05d33945d08f82974f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ccc6b1291dd41e442971d187dcd84bf0f3799442102c8f5a513e6822b8c079 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b358721532358f16409914c6ea3e9aaa058198c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:090e37e6502771ffd46b0457e94113fa98b5fab876aca07b1b3938598027a3d4 +size 132046509 diff --git a/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca0e4414141f0e4b1bd4e5d136911df8e8c0eb71 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341f98e16dfefee8eb546d161a0d709f3d454aa9695e18fb3d8d6ee94cc7b845 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aad3d0602f9d91af6aef56006b853196c84adccc --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e9ecc5b2b08a9629f0ea0853859e441ba4b1f61221c5ddb7ffc23547f44cb6 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48a362d7c92751b02149502093032cf19cb2fa54 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f400dfd87be6511da665f31237386538d0dfd0d89f1b49ef4b50bd9ec0b00f1 +size 132046381 diff --git a/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..257a6de1732f2ecad87264c6f6ebb30c7ca00620 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee35160da1fdddb6dc01446c08a99c30ada41704a76c702256b10185025378c6 +size 132046317 diff --git a/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b364ec851760656e0fa86a081edbdf9e424de9a --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e316b6accb482137b3d3a4fe80d1659ebe56ad687e295ef767ca5d660c4391a +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8dec52d5c1327257e61ea195c9e263913a5181f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b3690dbf5dd136f6016bd66e4483c3d3d773427866c5060d534ff5ef9385110 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f9dddab99bec1ba6ed6095fb7363a5c9a18e03c --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c169a07f4411ab9e404b2373857557a660cea3f164041384de4cfb0e1ccdcc97 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cd17a5d977a7810d285aaae009b18efd6f2560b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042e1202e60ba03a3b38d191ef2e3b89020f6cee665c3e881de4726da1516608 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef0067e13963aa5cf53c64554907a1cd3bbe387 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d656ed15fee2679b32f85f3de751cb9dcaec34f79045c834dc81d02874ba04bb +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76dfc43f548c19af38e9d476df3a071bb413d269 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600f9ec31343db0df3689ef9b8ed3f34ae64c5114da76f2fa18b98a7b5d7e185 +size 132046359 diff --git a/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c52bcaa41d89c110b5ed32f0a895342bd59996 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0097dab7f2862e3151f5e364e1ff4c5f37d9a2be4a58b5f70fc358e549191f5 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac728e9b93359263eb02d0f53303ae56b18c3fea --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34db4dcb4acd2600b52a19e61ef0b6746af2735307071e7e03a9c6b1a614cd7c +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54259b9e71c3d33cf371b871313e0d604db9d3ec --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7052bfe5dac540632735f24cb5c56bb33d55815cecf9e29d96bff5f86a76bf3 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87368fb096eae484e7ef0eda50a0b6ba1b1c29bf --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b552630c224aa9292967ed3995d3890064aa3b74d348d28df61dcf5ebcc5b420 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1e75bd265845d6e257f87f75eefc93c67958a81 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692b0b9c927de56dc4e2f98838af6e50ed9e00c8f2478e5568de958b2875868d +size 132046562 diff --git a/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ece01e80c9a4ebbd8e392da251051fcc2c51a94 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25f7ef1ba82966aaec8e9b57fcbeb0d8065e3a93534934d82de442940cc5c6a +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..719f5a800cc2ea72ec21ecf3d9d6324f63a9482b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04696870f6ab2882c93a202f9f7b43d4c351697114a6f5c79af4201d1e7ab44 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd65b1cece0394d9e06cb7481a5208806a9f5bae --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77f019edb5fabc321d5953b242cf1f0148b4e735cb52eb4b694d51e45d0f41c0 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43444bb2b65f09d23d41e45533872c1d0a44ec94 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c828461c728e2f0db3e4d98faaf66c7baabaf3379d63e528dc93ba2dbfa02c35 +size 132046562 diff --git a/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4483b6296da85485befb3eb5dd5bb4bb297a48f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4142e2ef27d75203389f43b4c0a32417e4b525b3f05b7ee23c5b69e29e488cc +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5a9b92048a8ba8fa2ae0eed1e099359eeb8ecc --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50cb705df23d00723137f7bcd63ef3bbc592417dd5479a1517a3f710040cb74b +size 132046359 diff --git a/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fd2a04204b707265085a1975de3dca40d83296d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70aef96185547fcbc119f6253b949c15363758ad19000a312b99dc0a62251c01 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d518c6f5f12f4f9e3f6c2e9797586ec3f6034d5 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d9c661478d2f67cad395a8bee113ee41980a11e4eaf20f3312719c7c070281 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..664a36f039656779ac3226872c8403863a17bba1 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44ed3a61b1a6c43fe970c5e8723c6127e9fe8b0572231b478bda99a83599de0f +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6632096399452f386b5b40e17249769bbee66f0 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9955309b576260246923f4e12a4fda6a58a6c5459544daae82424a69fea6cf2 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e9578a45f7eb1e42cbad878f5c8067edb696c0 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0dcd9d349459f92c76d6bc02659adfc88dc8c98f2a0982cc503190b146e621 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74e378e33b4b03e1d70c71742094203ae2fa7a26 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:562c8298027fc0676bd399715da799db3f14147f036ed3ce714a6db1177596c7 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c882455764e87646065af8a7994ceff6684c52 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32af03477f7ab408721cfe4b97ed59e7b92de129ea250773c671f5feec08765 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da16b90064c55e8568d4cdd7e06eed12310d6661 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:455a09beff15fdd80fd8e6c73f607349903b46853973ee1e629109729ba65bdb +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5667ce3aa092b60078a4406ae20af5ac82ccecff --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4598f8b1507df7476d3685b9361135c098662d57fa5bb8e7e95c95eb556a0e8 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3edc9dd2072334a949a591d0ba81a89e1c56e9f4 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca36505bf4d7216f6901a25c91d62be4b1c487d8ee90945604880929c61ed42d +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e8d4dfb1bbbfaeaff58c73f77e33b3ec9405bf1 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64dad88b9e97d50a88adf4227683b604a1488937e1da4b243c0efcf0dc70990c +size 132046487 diff --git a/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33915835afeb46fa7994fae7d2761783e9e1c877 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:213b1036f666b80156bcf8e3338fa12cb2060615e6a1bd25c3513ff19679191e +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87e79c6074328256fa75a813f5fd6cb9b923fa6a --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:509226d1121c8c26f91fede7393dd4db538dcd032892e650065ed6eb12447d91 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..018f005dec7755960be6e11c5bb1e27a76a270dd --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21666f59b0b77cc382b327a6d206c0de1b33f76fcf8dcd9a0f85b61b7d4c44ec +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9864d3ec0e6fee9c8ef17a34bd50e2521e82faf --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54eeff7ecf008600bb2a191f51742a9dd12143a72883ab2094838a318b3e0f46 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c442d77240a90d21a81eecbb05c17a9d1b4b1196 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c688e6a7e6bc637298f2d11ccfc49a917c31b392a7057c044d9076ec7dd10278 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04868420904fa00f9ae444dfbf739c4039529eab --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9923be9905311feb5234466102dd46e8a90a5a1453ffd6b46aa28f39abea1768 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb298dc090d5c057b319d20bf9dd3fd93a1c77da --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55829aeba93dac7484550c954c4c60f24c92e3ad3dc3d336fe93ab0b8a84f4b +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aa59bb86756437452f00469f8107f62a45d8d73 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e17bbb43fe86646595ff37cb87359a491b5bc77e8e15d8163abbb654858cbaf0 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ba89b476b3081fc95377c7b8c5e021fc0f6edb7 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4a42c6097fcf40b6622bbb8600f2b0c0794837756ebb91e750bec8ac58263a +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c86d47bd8499c27451f412d45d5e3b6e07cc8f8 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4ef8b9423d57ae818b5a30c2f4318219de5606b5c50cb34d65decc1ac5e0b91 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a87ebd0b2660154b98c3c617bed3e451b1a3beec --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ee420303e6b54da7c32dfb0ceeef5098e8af73d0ad244dda3294418c1085f +size 132046295 diff --git a/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc4448f07e7fd708d7a0ace877a0782665ff1b3 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f97b24c73591fe0c1423c4dfc3d54e1a2a244a6e494ca1402277684856178031 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2617175fcefc3b5e92638e0c005736afb1a4494d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2375358a84d29fdf6e8172e87dda90be53a113427ac555415dbf4eeff0b9d40c +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c96ee73078580a2fbc262b0c3ef9da2c1833f9e7 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b4ab15786dd8e5c1c84ee2005637851f48f3bf7871063e77ce55970f69492d7 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a1790aaa8be65dff591c870e4cbd544f9ff59c4 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd0b5c0fc8f8887a94ac7a833dc3c5ed8a8f6805bd4c0c9fef07ec4086498b5 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f13e47e6ec19258cde78ea93a4d7175881bb73b8 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eba8fabcb8d3a14b5d8797b101c9e32abfa3bbf888e50c6f454f451309e32814 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9576cff98eea2f891e0c3e53e645e2263f414e77 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65a02079a1e85d79507ebdf9132996eef1db5e03a54f12f3e7553dec620344e5 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8706200b7fe41341d63b268e591c56c4cbb841d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853b087b1e7f91a47d32fb36b10e8aeac2cee3ecee1fc0e6fc26ff73a725002d +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e62dd30412fa311283c284b4a4f652c21c6e3b88 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51195e9fb22183c3b2b48ebb34afe9b87cc0915898fd6c012a4aa23bdf7ebdb5 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1b9e2e60ccf1b5451ccefe702f796c6c9ba15b2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ba1a0b01bb485442d558ce457bce230b2acb31d8b73ff97650f75e98610267 +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9bee69afd02d60e2a093b24e20cc8972a98040f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce9090b89e6550946cc86f914ca5496d5fd78cf8d8c7db57b9a99afe1b446db8 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbea4e24a461fcbfbb731d8bff3633c4380ae77b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89bf24bd7e9713d29432d96377231b089e1a3b4010bd880b3243c4cad9ab1b29 +size 132046359 diff --git a/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cac648b40fd2082065b0b7df426ea7cb30f3241 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433bee52212047f57da80acf20dfe87fe7c0f85c3bc964e931058a104f493850 +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4b43f66a038caba7e55a95baa6e146c55445767 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b6b1b7c093d1285f251f730fb765defb13e41ecffd1258479b97ac7a2381a2 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..680aa6c3a74baa955fe097b08efd5df1de13163a --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39fa210afc7b29062fb790f5de2c20180fba33935e72079f55c3de00e7ed9ac +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d756f5fa6ca995b740de41ccf0dcbf4581a87589 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55ca55a64831a0033fe3f32c60ba0f4af5661be57a4322700b6ea732ca2fb4a7 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c420a081cbc2518ee1dfec9a2f4fb537584645d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e0bac1c955913e9c37b83336a0476ed7b793ffb203d7058c93577c774f5517 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44ed4e7b05a534d7e8064a58336a918e0a8f2b88 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ee862c605c21a7f88f98e073699b942f4ebfb125a8535c1a14e8e2e89a0d45 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adfe2d1fcb6b7367aa7d69b37ddd1ba640864985 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291a40abce8cea1f1bffa159576e9c2b582dc9468839ee0f234754eb4001d011 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd3f2848d6873d26b750f0e9298a9f04df3226b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb93081ed9d771ce38e1ce6a8ba1aa7cfc803952902ffe80df6d474a9248458 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1fc095c631656bdedf9c0746b499416dbeafecd --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce71b8086605afff23d9cfb658f9ae566fac9a62f1c2fc4f5360d08c3f2cf27b +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df21810e0122369daee494b74694446d25881b91 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee2783f830f3f0a1a306afa63efd405f741ba56652f09bfcdbddbc3707b456c +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c63ee3ecf490b45ac855922d007ba31edc0417d --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3010fb937c5a899476c1c3ed9d80c7eb93488b56389191ffe0ba2d47f6102b0 +size 132046359 diff --git a/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eacc439a4b36a255397947d43f670f6bb1b05826 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f351affc2e959b3d999833a0a7f5a704bf11c6744c5b85a964e76f345ea44d9 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a7379ea50dbf0be3d7fbb43cf55ac52327dedc --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f79651b1eac2b8c332ce7901f064dcf14aa2c08aa2fd268f022459bf7ec3cf27 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b389124c2b17030b0edc8bcb733a52255ce2f40b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88ed5e8253044d767f8e063bfa6a51380ab6d5ef64d8fc665f9cdc3b901cc16 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..237c96a942fa2bc3fb91316a311cf07ae923829f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5240af31de0f48a0bcb9e7b5f2d71a4682e7e43ad4c31e743ddc45be5ac8ecb +size 132046562 diff --git a/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0db25247fafa760138adb6aecb403b22e68201f2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ad0a55fd5da67c023308989aafc6a2284d035d5d6a10368caef66da6afe740 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b7dda2c267f73213b84da5acab1aa01e66fb598 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54bc74abb34be471887ac64f9e55d583b1351b400b96ef297653327be7035dcd +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..651c2193fa2e060370699de521db58959222b06b --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068caba576968521f89f83c56857aee7ae581fcf56e5425775255b342816cffb +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d8b37d021503bf58cd6f9229aab06f38a96a79 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565be0290e6c88ce7ed9b9df8ee5f8e6a14be4c70228d9c288f46854f13f9daa +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..936a7cc0315b3885c8431b66e9169e50d51389b3 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c45e4780895545a0d09a7e6a1493d4c6659f4d6f636d525f9d0140ee7259eabe +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5444e005e4b52da8de571d346c06875f815768 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bce2d9f84c52be59f981ceceaf0e62c1e4700e899c2da7f6f1fa20a159ea00d +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe267ccb26566e6cdb1a1ce6ea4b7b836ebd5388 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d53edb3d88df2be910fc4db4533c2257d04fef13abba6b851e5e3d6e2d47dc +size 132046487 diff --git a/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..701e5a94c3a8ba8bb561b8f533599b7d879634d6 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3912626e3154f7ac260c069b9629e59a7f50fd2f674da868b32581e5314b3135 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..329b786ac7d4b0eba4ac1ac0a512064b09d43c7e --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac5a29231add0a36c5f49224d49c5794ec377945814c45ef172f01a5669514c +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c7ccc87fc2332640934a12b96c331010cb83d2 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09826af7464cd3d07f1b15c7cea78d1406993f0f24ad98e46c0079b39f45bc75 +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bfc908ce9db4d7243bc80eb8a5d4593492014d4 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd380ce8e8f8ee8fffc77b9eb5ad70b6030cf510803bb80ddcea7496501ec3a8 +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4caca44bdbafa3aa4176fd5d71d7fd6acbc685a0 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d4574009786c1e94559ed9e7f6a23b47aa539fb44b205c2c61fc503209c6d2 +size 132046434 diff --git a/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f9c50603148ef8094201ba22365c18fb76d8f75 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1814954a1fa0bb47a0620ab3258d2f3837a62ed6e8b0aa78a7c5b93528d8031c +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c8817fe607c74975035bc259d63f848b929282 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:147591d90a266a7105108c90f1000853017f44d8c05a2b8d043f70c354b5d0cd +size 132046370 diff --git a/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..002bc10310c5a85d78d51cf157a9028c41ff31ff --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35181f051d996139b607380f92947c3901a273daa62d59b98c051d256803024 +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37d7349ab3faca3b646dbce71bd9d1467ad90b34 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f38f48aa437ab222e7fe00709711f5cc519d50e3023828186f93467eabe1e9 +size 132046498 diff --git a/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb53cb592646ed22f9074717b11850745723360f --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77acc21b535c381fc27078355f15c74497df1174495e1099256df2cd523491a9 +size 132046306 diff --git a/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0333ac1081c4c0ddeacdcc46e87c3bc4d4c295e9 --- /dev/null +++ b/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82797ecd95ddc2abf8511f6305323fbf5b25fa155666a023825fc9cb1918efd +size 132046359 diff --git a/global_step52452/layer_01-model_00-model_states.pt b/global_step52452/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b079d342c4e52e5d137a6ee32b7348ee3ec429f --- /dev/null +++ b/global_step52452/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d88828d3c8dbeb87728b677272037f307e08041d1d82aab25069f105ed9f97c +size 283772163 diff --git a/global_step52452/layer_03-model_00-model_states.pt b/global_step52452/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5d3428316edcb87a356f6b4f4c4c281840e523 --- /dev/null +++ b/global_step52452/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a6436d62b626690ee4b875df41ee74b9fef6ac38a5d5034dc2d6a59fd159da +size 157357315 diff --git a/global_step52452/layer_04-model_00-model_states.pt b/global_step52452/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5888afd06ee928983e0f1da3c4c8ec41cdcabdd1 --- /dev/null +++ b/global_step52452/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f763dcfba0cf4c08865489ea2a442dec7759e6b1584f99098d62c587ff58d3 +size 157357315 diff --git a/global_step52452/layer_05-model_00-model_states.pt b/global_step52452/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab2e889467b112299841c10ce37ba1c62e48a97 --- /dev/null +++ b/global_step52452/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9194b8ee71b7819eee6ff24dbb8f1b928d830571af1fd643cf987a4733f296dd +size 157357315 diff --git a/global_step52452/layer_06-model_00-model_states.pt b/global_step52452/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f678aa84a23e44834a0826699a969fd892ce5f0b --- /dev/null +++ b/global_step52452/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b548351da4836dd015ee915ac5d9cd39e97278da4c27c0b0289ca503e20438b +size 157357315 diff --git a/global_step52452/layer_07-model_00-model_states.pt b/global_step52452/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71dd599a1add25f55e9d2edd09b5ab9c171de521 --- /dev/null +++ b/global_step52452/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eae191ef9ac49222a55bf67ba95325f32defc1617ac006e98661665a2d418342 +size 157357315 diff --git a/global_step52452/layer_08-model_00-model_states.pt b/global_step52452/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a842c8fec7eb0fcf4373131bb72b0a4803de2c --- /dev/null +++ b/global_step52452/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbae5119398cef05b01840fcdf4641da86f3b5432e3534b07e50a002e60d8616 +size 157357315 diff --git a/global_step52452/layer_09-model_00-model_states.pt b/global_step52452/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c6c92a5635adee9d77cb8fee31697763e21d6a9 --- /dev/null +++ b/global_step52452/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5387a8248428b37d3f569989a94696c6610abad81f41549b0519106cbb84f371 +size 157357315 diff --git a/global_step52452/layer_10-model_00-model_states.pt b/global_step52452/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..303a00079917eeec51117064886bb1bbad8f8e85 --- /dev/null +++ b/global_step52452/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad6d812e225b7eecc2ff77f98cb0568df7b67474f698febd099a4cca3eb0ca33 +size 157357315 diff --git a/global_step52452/layer_11-model_00-model_states.pt b/global_step52452/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f04d9c54d63c12a7a26f620a3d46f327673b71b8 --- /dev/null +++ b/global_step52452/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2906196421f1637145cbe5d34bba26e6e033d9a3a0bbf52675625e185c630771 +size 157357315 diff --git a/global_step52452/layer_12-model_00-model_states.pt b/global_step52452/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fafa3054a6c174e56394a5edfbf78be919a27c4 --- /dev/null +++ b/global_step52452/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f9fe12a5bf7476f69680901b9d28e6fec8e2f0c85e786ae4cca7174e9a875f +size 157357315 diff --git a/global_step52452/layer_13-model_00-model_states.pt b/global_step52452/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c9112a50d86615401004199fae38ae8ec396942 --- /dev/null +++ b/global_step52452/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6871ccd04945dd890bc0d086e0fb19ad8aacfbb126f8ca7f824578f76dcb67 +size 157357315 diff --git a/global_step52452/layer_14-model_00-model_states.pt b/global_step52452/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda39fb127c2961eb72c7c3ba3c1008aa1fb2ee7 --- /dev/null +++ b/global_step52452/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d75c6f4418343417b444c01f9041985c0a3af8f453f975b6028208ea78924f4 +size 157357315 diff --git a/global_step52452/layer_15-model_00-model_states.pt b/global_step52452/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac43d5660018fdfcca6566ea7c579b269ed53c90 --- /dev/null +++ b/global_step52452/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4fb6b54599a882a78547c30c4de0efc117cefc44d63c0d27636c6bfea389de4 +size 157357315 diff --git a/global_step52452/layer_16-model_00-model_states.pt b/global_step52452/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..044b16f2487faf54ac4d664fc21dd9a4e2c85bc6 --- /dev/null +++ b/global_step52452/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:831729e14e545fc9b461453e97b15af210077d1261d783d06a52871ea323d741 +size 157357315 diff --git a/global_step52452/layer_17-model_00-model_states.pt b/global_step52452/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2474da108600a00b2ae50bea61c607d43f9d148 --- /dev/null +++ b/global_step52452/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:743e53ab0fac06ffbda75ae7ac756150e33ccdbabcc7375a0e1bb595a776e72f +size 157357315 diff --git a/global_step52452/layer_18-model_00-model_states.pt b/global_step52452/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..255d9375e39bef880c376a71770b6450364e9fea --- /dev/null +++ b/global_step52452/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56c2db6068ea05ed11bfab52a359d9acb18fe90f59371c1158ec179b6e540f9 +size 157357315 diff --git a/global_step52452/layer_19-model_00-model_states.pt b/global_step52452/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be74b1a74d050ffdbac0049fb26af224c5c616e4 --- /dev/null +++ b/global_step52452/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:381669f1dd605bb2ee6b89b4ecf292665c775a9b6ad34acf5b14007c7fb0acf5 +size 157357315 diff --git a/global_step52452/layer_20-model_00-model_states.pt b/global_step52452/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8725b497df8d0ed84617015c51dd69460e99aeb6 --- /dev/null +++ b/global_step52452/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e11871408ef8e412a27276a490fc0e6df456aed540c6b243ebf413dabb023e5 +size 157357315 diff --git a/global_step52452/layer_21-model_00-model_states.pt b/global_step52452/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed1ca61ecefd409ee471f954f67647dddbf430c2 --- /dev/null +++ b/global_step52452/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad86bca7f78b461cedb510c9f26887c685162612bbb3a9d9e3a67cac20159e1 +size 157357315 diff --git a/global_step52452/layer_22-model_00-model_states.pt b/global_step52452/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ac6e9fa3c8c956fb668e9354f394ad00625e45 --- /dev/null +++ b/global_step52452/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60d5803f9940774a914cde82e7d3f32dc830389fcf4a7fa698903c3428b55cc +size 157357315 diff --git a/global_step52452/layer_23-model_00-model_states.pt b/global_step52452/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca3859a187f62fbf78b3c425848b7b6a2e4a12f --- /dev/null +++ b/global_step52452/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b319e8f979c6aabd1def9418f4e7c3825f19472631af4ec00aae6e0f949b7eb3 +size 157357315 diff --git a/global_step52452/layer_24-model_00-model_states.pt b/global_step52452/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19e75c8093cae537e55fe41034eb94ea00542c31 --- /dev/null +++ b/global_step52452/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dfbe645348f9ce72eb14a5f6290ccf0b9ad748284aafd3d6cc7d30baef26751 +size 157357315 diff --git a/global_step52452/layer_25-model_00-model_states.pt b/global_step52452/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b59ad2fc0d5532ad9422d261938a94ca2340e1cf --- /dev/null +++ b/global_step52452/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd353b98b60b2136d95a360e8934cd9c7ee0212c0650151a1e82f82a67da571 +size 157357315 diff --git a/global_step52452/layer_26-model_00-model_states.pt b/global_step52452/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a23c67bd9e19ff220e206d7f84e66154e44a2e8 --- /dev/null +++ b/global_step52452/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954fae323994f5ad0c138928147bde7258a975282653a26d134cdf3bd6245df9 +size 157357315 diff --git a/global_step52452/layer_27-model_00-model_states.pt b/global_step52452/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c86ff76becee63332e149fb98733a3df932795a2 --- /dev/null +++ b/global_step52452/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2e49ac3809ef465638194de29c289a465352499ea60a5fa74e8dbc22cb4f05 +size 157357315 diff --git a/global_step52452/layer_28-model_00-model_states.pt b/global_step52452/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d692af766306ab00e5a68ab42c4a06914ca66bc --- /dev/null +++ b/global_step52452/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdf99773f33fa99b65ce020f3da265a9e3313d764032c6155e0343ef4ebb3e27 +size 157357315 diff --git a/global_step52452/layer_29-model_00-model_states.pt b/global_step52452/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64542164928a58f5ec16ae943b8169975c79bb70 --- /dev/null +++ b/global_step52452/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8328ca20613e506f7119fe836372e535fd688a9e5ce5abdde15fe998a477be0b +size 157357315 diff --git a/global_step52452/layer_30-model_00-model_states.pt b/global_step52452/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbe06e70dd40c13d591745d09c70a48ac226cb19 --- /dev/null +++ b/global_step52452/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5f170b6bb7fbc56161a79465bc11b76b7e1aab127ef3cc80a400b1ba057a5d5 +size 157357315 diff --git a/global_step52452/layer_31-model_00-model_states.pt b/global_step52452/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5a9502d6e9db30d5a8e9435b394d2867438c7a0 --- /dev/null +++ b/global_step52452/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fe7d67718cd465c2432b55ccccacf594f93be8480145d746733f8467af9e68 +size 157357315 diff --git a/global_step52452/layer_32-model_00-model_states.pt b/global_step52452/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..526be5aff6149cf9968690f9f3df14141645c7c7 --- /dev/null +++ b/global_step52452/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d46e09181e4da9c4b57b0d5f8ae59aacf108365ab6b4508ed600831470400421 +size 157357315 diff --git a/global_step52452/layer_33-model_00-model_states.pt b/global_step52452/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d90882770d4a94aa507b32f366933f0bd8ab872b --- /dev/null +++ b/global_step52452/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:343fa65a4fb969ba97f9f97ccb63aa43ef0f71a23567124ac969e9257c11bf36 +size 157357315 diff --git a/global_step52452/layer_34-model_00-model_states.pt b/global_step52452/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1abc7277647bcd6fef481474b16d5e2ce9b5b256 --- /dev/null +++ b/global_step52452/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03db034b8b008b22f9ee144e1f52560ef69df81eff37bf2e1147b801ad5741c5 +size 157357315 diff --git a/global_step52452/layer_35-model_00-model_states.pt b/global_step52452/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a0b0c8002c5b6195045d436d6160365ebbb0f13 --- /dev/null +++ b/global_step52452/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f387a665d3f94fc10c6ab24aeb649d00a47939751cedb08341c5ca01254d2af7 +size 157357315 diff --git a/global_step52452/layer_36-model_00-model_states.pt b/global_step52452/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..974bafdad6c3f970c698228f0b319e6e461d9abf --- /dev/null +++ b/global_step52452/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19f976c81b35606d049c41c861d4716601ede0c70d1fcadd00e6d907605c6e9 +size 157357315 diff --git a/global_step52452/layer_38-model_00-model_states.pt b/global_step52452/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b14865cd3b7eae246130a8691001655202140fbc --- /dev/null +++ b/global_step52452/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2179bf09a6bea5a15c18dad917c4471549e98541d6ed5db9e4bef25b654aa243 +size 11459 diff --git a/global_step52452/mp_rank_00_model_states.pt b/global_step52452/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90780e43769a483bed6a23c1d62e8b5da0839605 --- /dev/null +++ b/global_step52452/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb4c643f861ade3ff8d1a8331eed67e953e6d34b4cc77ccf8b0f52a0891a687 +size 50483 diff --git a/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675416872.nid007045.14369.0 b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675416872.nid007045.14369.0 new file mode 100644 index 0000000000000000000000000000000000000000..9f1ea478502d32a225fc75b280cf1732ac0d3623 --- /dev/null +++ b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675416872.nid007045.14369.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da9c481fbce2981da4bd28355599ab4756f8f92de738ce19a06c58d9d32c996 +size 20447 diff --git a/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675417560.nid006815.14328.0 b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675417560.nid006815.14328.0 new file mode 100644 index 0000000000000000000000000000000000000000..89afa909c52e080569691a7c7d97afdf272405b8 --- /dev/null +++ b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675417560.nid006815.14328.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27fb3b196d85cebd604985c5cbb8c018f5672040dcf336cfd906068e151b1f8f +size 324518 diff --git a/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675418371.nid006524.39299.0 b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675418371.nid006524.39299.0 new file mode 100644 index 0000000000000000000000000000000000000000..2ed082cfcb1a2b4668308a50a7e38e7b5345c37f --- /dev/null +++ b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675418371.nid006524.39299.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c342293a6f94ff953526d629949c292f62091be348f01d20b75dee3b1061b46f +size 76278141 diff --git a/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675856535.nid005375.21043.0 b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675856535.nid005375.21043.0 new file mode 100644 index 0000000000000000000000000000000000000000..aafa597e86b353d794a6fe4167e075ec7c09a4cc --- /dev/null +++ b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675856535.nid005375.21043.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd2b8b54e9229fb73b34e702344ed2cc0ceb5a3fd4bd934d24c1a4617759b80 +size 40 diff --git a/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675859535.nid007001.106539.0 b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675859535.nid007001.106539.0 new file mode 100644 index 0000000000000000000000000000000000000000..52c7e7dfc6f9a65a437d0a1e59689599d48b09f3 --- /dev/null +++ b/tensorboard_2b855b55bc4ul2ndfixnew/events.out.tfevents.1675859535.nid007001.106539.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d7ba7225cbd45095b8e3e10de53bb333a9c4309d82ff3fc7ba3d88212033dca +size 18897602 diff --git a/transformers/config.json b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9eb00a0b27b44ef76dddc1b1d830ada6509d49e1 --- /dev/null +++ b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 53376, "n_positions": 2048, "n_embd": 2560, "n_layer": 34, "n_head": 20, "n_inner": 10240, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/transformers/pytorch_model.bin b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a055f0a32a76d8a6ec2e9b07808538ce252f669 --- /dev/null +++ b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd3dc0820a7a57c3f0ad20dc05cea17d7a1b5b0028959a8e8bb26c1ffadae24 +size 5919146061