diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_31_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_31_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c0276e9a9adac725cd09c866800cf7586c596b --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_31_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ea25e053adfa9fc9a654897264eb9bf469d2253d81b952f9180bef5a0e15a6 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_3_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35496c458fc0510d77306f01618938cc57f56d19 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f910b8a6826b4fcb82516e53b3c35ca2412a4950204baa3b3814be3569c98ebb +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_4_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_4_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ff327e383b649ff686255651c3d61f16cb13529 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_4_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18db89e3718a52849d725cf717b63ec0b6ea845a9a40057020809979fe42893a +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_5_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_5_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d7dbedb9ff2690e9f91eee0c693acdeadad604c --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_5_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9935b1af00a6ed77a9bde254d5c86eaa4f50e1ed6daf19e953da27ae8e0e8b1 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_6_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_6_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d8b9b75234a688f2de670c42705bf262f92502b --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_6_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c025e1902057f64b85809163dc16445df585eb6254e539e3467eacb5b61128c6 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_7_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_7_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac12d2d50a83529fc24eb3472364b277acf608c --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_7_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f900cc450707f6f2d6c503ad0835aedc1784e6d8bb2e38843c2aabaf969776 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_8_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_8_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb8edf141671669494baf65b691937cf6500ff9f --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_8_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c25b3ea2279f1fcb38786448a7faccd323f57134f543375740e21ecd9b75cf0 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_9_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_9_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6406532aac8f5be57fefbf91746b5423a8af4549 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_9_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315c5da4f8330b8689e20b91f398af841d096ad10d17c3f45f299a237620cfdc +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e11edc726d931634aab8066df7373fe1a5d36f7 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8b3ba62b181d52c071f83a53a73b199f88f77f0a9db95e4cf8b765c047007c +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..201feb1de302b600cd58168413f6139ccfab57a1 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa6ce6f86f8a6268d5e5836033050f1db5e58790459cd5183975283890b297a4 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f4b2d020083c26d131d0a9359b30d9b29c2e106 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414747eb8eb04949e3160f85efbe6200b03d17e3b2b64e338ce2f72dd1711ae3 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5ca01799450aec986bce4fc6bf1628ba1289671 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232b5f8de48d809727ad624456b7514834c3cc38ac94dd8d6932976327691e53 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..107074dbc5d9d078d4b4e1d786db2a534541aa85 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb5564369c446954cd20e69ce7b0e382e3edbe8a1beec772079ad24561c9d782 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f80f9ad97a00f05e11031d7da4b928d38929a04 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258be8527143e86b35406f0f299629c04bea5db836ced20fca22a663ba9e74fc +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9d1c23bb1481a0619bb1185e368dcd731765c51 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf5744c0208b8bb995d9b2dc3004b91afaccc04d4e623a10cdfd2bd4253371ad +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..327a06ff7a6045459e487b25ca724505d0676d0f --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c70770ab4f90865dc18412573636e641bdb0df1132d4a7e4aa30b0a70bf0fe35 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f194f94920bf84f9fa1ca8d423fd95574a1e3c0 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d483326f9dcb28e1ec22efb44d61b739a23982ed85e2996d8c4b2a26ffd0dd +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afe02e39ee18197b23f4bd4a7525a24a1289db82 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de59c726aa0c526034c48fbe269efcc6fb0a4231068b81c2f70cc6c6ae17c796 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a99e6ee36bdb767ffc47fd5d4d2edc29022fc049 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3218b72b8c3b9de1fecaf89f89c6bca92f5135d0206144923a5b1a6723ddcda1 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08d5b31ca74b308f01b8e47bf8b55d2f29b16c4e --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686c56b00d551dcb8b8aa914254a08c3ae6c84221a28cbdcedc04fc5d8a5a8f7 +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94fc40d0cd365a41bc18b6a42ef5704ba79b8f07 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:666d94e65dd057bb988ee8b0c72aceffb252327435737748609561eff1b10416 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cbf843ebbcb2bae2feb646abd24e006d88fceff --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178b7e81eae84ac10a3237dc9afc810dd448fa6ca2c6b50cb9c27317d387882f +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..673a00f432288a80a149b676a2c1da242c7e8f6a --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91255a4d4e9121544de14b6ab87918fb946596340ceddcf8d7fdd3f66c660e99 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d531bf5be000c47d23ae5805960782098e60d2aa --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25c7b37f8db0d738f0761d3f1aa9dc8adc5485a526ca88bf8d162977d2d29c4 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef85f53284d0029dcf32fa4c6db6ced230a66281 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b499dbc2f001ac27f5fb20d92997ac31778c02b8b9f6d28081fbae57f8277382 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64cfb46f6335e2234bd9d57e4a34115db15632d0 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd6bedc63207232f56294e8d4b6ed7116cf344840bc88be572c9c828d36b30f +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d64eb264185358ad829f1c3a584fbe713334d9a6 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f475dc0ccd0072ce0880f81f54bb413bf53ac47acc1f376fa19b321a89f4fc05 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a4a23ace1bb351415085a997a77a268b151aad2 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca409e456f3ad1da83a290280eff714f45ae7b02682c1a61b36a1cf45c0c7ba6 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dde9f2aeee209a0189b57338207d60d3b562edc --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3890d34e8be5d28b57c8ce6b173fd4be7d0ce02ac101a0fe1174be8d427f986b +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81fccaaa5a6d1400ee533a46d5d26d8eef0706aa --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff094e8131732963d9280497fe3807af154a2a100c85fd9c6f0f35cbe056045 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c9c38bf6c34126ef8e2b2b46ebc6df91da09d79 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55746bfe9388f6c3492bd527e0b24bcc4d3d5eb4f3d63d5d914b7c33c9790441 +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aec55d34bd8d3c4bfe82cc9e28529761197e3f1 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c7cd2bbc7c8349a408f09aac2418c2bf58fb350d179f653bdcff1191771affe +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef1b4c4a02a615e7534414acbb357e941db40a3d --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf11329c35a291d587558a3718635a3f1619db132f2cb4c5c198b14df25ca73 +size 229713809 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d01e4ae2faee9a1bf4ea463faa00e5d24e6c675e --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f24552dbed19cc3c8b64eac0f5207bd33bf7025ea4cbb0da3cd0162b1734a6 +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4ce608473b3dd3dd51fdef088b26e52452ccfe0 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26acebf92a85fca863287859dd1de562e6cd045b07dc0282b6806cce14a1cf71 +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b456e8062b85fea6ce9e9ef1e76f7031e328787a --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799f22915883ac47d6867d99366e04e0a66ce282767bb2c9ffcd951a45168e13 +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3170ff6a5da1cc5aa6fb6cc353e9cb1ea5ef192 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35db4635ad2a4ed9d534ba844d2d45360768bf7068004bd5ec4dddc1078488d3 +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ad95904c8c58c47d23a9e5927d12c22e557537f --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d4cc1fbf083b209f7cbdadd54a780e4d61642324527301f766310737396d2e +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d81de37ceac32962b8bc71e0edb9d7841dce7a84 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24352b632299a2b63ed4c4ca23517c0b19eda877f2ceb606e5124565480fac51 +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aefc1ba024d5ebc773733e5eb165bde0af2754e9 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a4a875cd95f118b32f1872bb4a638f4e3ae2882576db048c99a7cbb92dbc9c +size 229713797 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_0_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1310bc229821939acdddfb276f78dcc0eedd550 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619fb7612ebe1aad26b276ac47f553ee3efa96dca289665d54e75b91f09b0a04 +size 158167 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_10_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_10_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eb9984ef2d94aea1cfeeb0b54ed48aeba800f40 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_10_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9732908f2ea186f30547e02ccf5589101272b2351e5a45c6332707fd3a3f12e2 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_11_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_11_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c653cecb3c8b9124ed96b2a4156c156b199cb437 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_11_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3897b666472a16ce29f38f5fcc466b7feca10e691b4e95198a645ac5f210b08e +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_12_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_12_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70ba306c15a209345cef8a044159b4b5e420c5a1 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_12_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9977abf3a5fcea1d51ae83e62ffebe3023d7cf1da7052d659355d46e10a56ed +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_13_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_13_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c664f2dad0d39036a7f68a982c410ca3211b756 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_13_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108c0d09dbe2b3375136f42c8628dda816cb1f3db0b694cce8d2310e5a33d181 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_14_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_14_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b19290e77ddf194f4bd9f92b67c4f3dd5ec7e16 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_14_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a479da97e476e0ca3ec9639136ccd811bfaf505a95166350913f6b02a976440 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_15_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_15_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a6d166e7e0c27d9bed572f2914b89d95bf629cd --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_15_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd35c86146520e48b14b4662a4ad9dbcc7c9d5a4f9d17d044153dc21295bf68d +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_16_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_16_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4d055a5d25debbf6dc4a2b75b1e1489ee21ccbc --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_16_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8002bbe0a203d949ca0adac3ef9f655a1908838520a12836cdb995408af671c3 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_17_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_17_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62e7eef535a44e9a62afae8cc4d763ccbe29a1b4 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_17_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e8fdd9d2e2e1e7cc08694e958a4434405bd88a2dc938fd9ad6063b2f4c4dd54 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_18_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_18_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8147a1c2ef464fc501b833a1325c32d4daa510fb --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_18_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bbea1f4600dd404d30e247df32f6713bdb92654476643350c80c0ee3e503e21 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_19_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_19_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6516fbe088d37666bbee7afaa8d32277c6bda07b --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_19_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f527b3b2b11b5cd9f0b05998a215c6b94096c17e8420406c9287148a70c1d7a1 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_1_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12840aba7c4d408f25fec5c172fb25c43090dae6 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf758d8908f518e609a6bed8068950bfca4cce221071ce54f423e0a093fba11c +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_20_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_20_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efed628a09692b3a4f805837c4e97eeaca8c0993 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_20_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81547d86f1d3a92e868474e47bd1cd3039bd1f522524e68a7b4c91e71a0a0460 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_21_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_21_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b17306533521753f1eb1f68c593a801441db8fe1 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_21_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9db930d15cfe143bc1d6aef4a393ed5ff2fc7e90338c7e9aabc7a8652730235 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_22_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_22_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab088a9f44c47d64594a32962be5e5cb0458de1f --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_22_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96e797af5ec9d0f2f53799e283c5890dc9fd4923f8f39e3fd407bde69f55cef0 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_23_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_23_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b093e510bab53fe58f6284021cb00a6454cb97 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_23_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb9a6ec878e9d9104e2f3ec784f1ce8bef1f5ed83b9fca23243d6d9d9d68aab5 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_24_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_24_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca684f6f4402491d4cc05ceb4a8ce1e103977b0a --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_24_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5dc860e256a2eeecd13f0ab971193a2dae9f82a04b350ce6961bb42990eaef +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_25_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_25_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..254745f43727fb0556cc34386714a4b653e26dde --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_25_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:487073c61e9c600c8d01f1f7c314bbb141c934735a3b97265d79bd0cfccc4c91 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_26_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_26_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8c45d6b932eea8315c7f41299f3b013a96cb000 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_26_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e502eb329637bfceeccf8e7eeb6516886188f85f996c7c66116914d38dd8661b +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_27_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_27_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b65ba593feefbc95e114cfb96ff7b10b17160a1 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_27_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd69b722c2030008cbf04418cac116dc67068dac559c5cb27883d1c666c9a4bf +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_28_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_28_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b547fdb76f0a4e4ff780640d12f90a46d6c05fa --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_28_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10cbdb77b75c5e484742e6b10143af7c1a3c0547df6e2c2a6a5e752566b4beba +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_29_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_29_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d7389d26d69947df9ade3c5418e4bdcad3e0d68 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_29_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a11f3f62d1263a5419d192801b0bf045b1f582b173d0c1093a0a7ebe40f2eb7 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_2_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6164d8c22f9e46f3d6fcb66a57f904ac95b17ab1 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f7a2f105311b6ff3ff794849e67a5c1b9a5fa815dccaff5bf0c97a48ba865b7 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_30_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_30_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7559486e3ab93fe5e335b4d4d8111b0175c30f --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_30_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18837ba2ea6fc722c980364e63aea5c48457553f131fcaafb2333062635347f4 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_31_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_31_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87617ac8b00efb71c7a2b9545a681a1131fdecdc --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_31_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b3da4bf2aae8d24ed5377bfb59bb280ef9275cab5e63a746acabb50bc53863 +size 158419 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_3_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5569eb913783e3753baea4308c58b231eed09de --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c175a37199be6b959a214316515a99409e084089afea0e42e801c935383f579 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_4_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_4_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ddf6b594a21181c33a4ab5af293a354faae6926 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_4_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0f19f0d0d2d67942753bc8f7eb0a436ae07473d4eb21d8ccd5fa12a77acad1 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_5_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_5_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a0f14bcc1d0c7698a61f51bcba0061826de661d --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_5_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:943943c230440d4f1d1e163e82c69db8746421a651914972a9b184340036b65e +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_6_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_6_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7af7c6ed0923c1fe841dc06cd127ce45d8ed0ebe --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_6_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0657b3cc063d23c622d6bebb49c9bfd36a29d3ce7be20a10b7d4e9feb9b112e5 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_7_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_7_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9eab5b2869fea0633755dbc66bb789336c9115 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_7_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2fb95d111ea9906371b27aba964a34cf18d6774d73ee40d25db30572b7d597 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_8_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_8_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ac233417fe7e7e7fe3c08b485e44cbe8ee84e38 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_8_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6486b8e222316c1d1eab78da8609a9bbe4fe39c418522af6d5a615245d7bdd30 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_9_mp_rank_00_model_states.pt b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_9_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abe4d6975a3202be73c43cab1f8e2f6240381b5f --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_9_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6baa3d9778c860d6be15f09ca02a9c56a71e760232925c06d0b8f51e8946b937 +size 158103 diff --git a/output_qwen3_plain_ar/checkpoint-907/global_step907/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_qwen3_plain_ar/checkpoint-907/global_step907/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3be267fa36f51656beec4ab3e74f02b36e62e32 --- /dev/null +++ b/output_qwen3_plain_ar/checkpoint-907/global_step907/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79c90d4cbfefda798bfdc399aa89b0c151b603f0811883d4c03fa2eb09919927 +size 229713797