Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_4_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_5_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_6_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_7_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_8_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_9_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
- output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_31_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5ea25e053adfa9fc9a654897264eb9bf469d2253d81b952f9180bef5a0e15a6
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f910b8a6826b4fcb82516e53b3c35ca2412a4950204baa3b3814be3569c98ebb
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_4_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18db89e3718a52849d725cf717b63ec0b6ea845a9a40057020809979fe42893a
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_5_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9935b1af00a6ed77a9bde254d5c86eaa4f50e1ed6daf19e953da27ae8e0e8b1
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_6_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c025e1902057f64b85809163dc16445df585eb6254e539e3467eacb5b61128c6
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_7_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19f900cc450707f6f2d6c503ad0835aedc1784e6d8bb2e38843c2aabaf969776
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_8_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c25b3ea2279f1fcb38786448a7faccd323f57134f543375740e21ecd9b75cf0
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-7256/global_step7256/zero_pp_rank_9_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:315c5da4f8330b8689e20b91f398af841d096ad10d17c3f45f299a237620cfdc
|
| 3 |
+
size 158103
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ad8b3ba62b181d52c071f83a53a73b199f88f77f0a9db95e4cf8b765c047007c
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa6ce6f86f8a6268d5e5836033050f1db5e58790459cd5183975283890b297a4
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:414747eb8eb04949e3160f85efbe6200b03d17e3b2b64e338ce2f72dd1711ae3
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:232b5f8de48d809727ad624456b7514834c3cc38ac94dd8d6932976327691e53
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb5564369c446954cd20e69ce7b0e382e3edbe8a1beec772079ad24561c9d782
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:258be8527143e86b35406f0f299629c04bea5db836ced20fca22a663ba9e74fc
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf5744c0208b8bb995d9b2dc3004b91afaccc04d4e623a10cdfd2bd4253371ad
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c70770ab4f90865dc18412573636e641bdb0df1132d4a7e4aa30b0a70bf0fe35
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8d483326f9dcb28e1ec22efb44d61b739a23982ed85e2996d8c4b2a26ffd0dd
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de59c726aa0c526034c48fbe269efcc6fb0a4231068b81c2f70cc6c6ae17c796
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3218b72b8c3b9de1fecaf89f89c6bca92f5135d0206144923a5b1a6723ddcda1
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:686c56b00d551dcb8b8aa914254a08c3ae6c84221a28cbdcedc04fc5d8a5a8f7
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:666d94e65dd057bb988ee8b0c72aceffb252327435737748609561eff1b10416
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:178b7e81eae84ac10a3237dc9afc810dd448fa6ca2c6b50cb9c27317d387882f
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91255a4d4e9121544de14b6ab87918fb946596340ceddcf8d7fdd3f66c660e99
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f25c7b37f8db0d738f0761d3f1aa9dc8adc5485a526ca88bf8d162977d2d29c4
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b499dbc2f001ac27f5fb20d92997ac31778c02b8b9f6d28081fbae57f8277382
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5cd6bedc63207232f56294e8d4b6ed7116cf344840bc88be572c9c828d36b30f
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f475dc0ccd0072ce0880f81f54bb413bf53ac47acc1f376fa19b321a89f4fc05
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca409e456f3ad1da83a290280eff714f45ae7b02682c1a61b36a1cf45c0c7ba6
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3890d34e8be5d28b57c8ce6b173fd4be7d0ce02ac101a0fe1174be8d427f986b
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fff094e8131732963d9280497fe3807af154a2a100c85fd9c6f0f35cbe056045
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55746bfe9388f6c3492bd527e0b24bcc4d3d5eb4f3d63d5d914b7c33c9790441
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c7cd2bbc7c8349a408f09aac2418c2bf58fb350d179f653bdcff1191771affe
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:daf11329c35a291d587558a3718635a3f1619db132f2cb4c5c198b14df25ca73
|
| 3 |
+
size 229713809
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d0f24552dbed19cc3c8b64eac0f5207bd33bf7025ea4cbb0da3cd0162b1734a6
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26acebf92a85fca863287859dd1de562e6cd045b07dc0282b6806cce14a1cf71
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:799f22915883ac47d6867d99366e04e0a66ce282767bb2c9ffcd951a45168e13
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35db4635ad2a4ed9d534ba844d2d45360768bf7068004bd5ec4dddc1078488d3
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0d4cc1fbf083b209f7cbdadd54a780e4d61642324527301f766310737396d2e
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24352b632299a2b63ed4c4ca23517c0b19eda877f2ceb606e5124565480fac51
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7a4a875cd95f118b32f1872bb4a638f4e3ae2882576db048c99a7cbb92dbc9c
|
| 3 |
+
size 229713797
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:619fb7612ebe1aad26b276ac47f553ee3efa96dca289665d54e75b91f09b0a04
|
| 3 |
+
size 158167
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_10_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9732908f2ea186f30547e02ccf5589101272b2351e5a45c6332707fd3a3f12e2
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_11_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3897b666472a16ce29f38f5fcc466b7feca10e691b4e95198a645ac5f210b08e
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_12_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9977abf3a5fcea1d51ae83e62ffebe3023d7cf1da7052d659355d46e10a56ed
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_13_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:108c0d09dbe2b3375136f42c8628dda816cb1f3db0b694cce8d2310e5a33d181
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_14_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a479da97e476e0ca3ec9639136ccd811bfaf505a95166350913f6b02a976440
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_15_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd35c86146520e48b14b4662a4ad9dbcc7c9d5a4f9d17d044153dc21295bf68d
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_16_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8002bbe0a203d949ca0adac3ef9f655a1908838520a12836cdb995408af671c3
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_17_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e8fdd9d2e2e1e7cc08694e958a4434405bd88a2dc938fd9ad6063b2f4c4dd54
|
| 3 |
+
size 158419
|
output_qwen3_plain_ar/checkpoint-8163/global_step8163/zero_pp_rank_18_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5bbea1f4600dd404d30e247df32f6713bdb92654476643350c80c0ee3e503e21
|
| 3 |
+
size 158419
|