Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- added_tokens.json +5 -0
- checkpoint-6000/added_tokens.json +5 -0
- checkpoint-6000/config.json +203 -0
- checkpoint-6000/generation_config.json +14 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoint-6000/global_step6000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|endoftext|>": 151643,
|
3 |
+
"<|im_end|>": 151645,
|
4 |
+
"<|im_start|>": 151644
|
5 |
+
}
|
checkpoint-6000/added_tokens.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|endoftext|>": 151643,
|
3 |
+
"<|im_end|>": 151645,
|
4 |
+
"<|im_start|>": 151644
|
5 |
+
}
|
checkpoint-6000/config.json
ADDED
@@ -0,0 +1,203 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/mnt/bn/tiktok-mm-4/aiic/users/brianli/prod/checkpoints/llava-onevision-qwen2-7b-mid-stage-a4",
|
3 |
+
"add_faster_video": false,
|
4 |
+
"add_time_instruction": false,
|
5 |
+
"architectures": [
|
6 |
+
"LlavaQwenForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"bos_token_id": 151643,
|
10 |
+
"eos_token_id": 151645,
|
11 |
+
"faster_token_stride": 10,
|
12 |
+
"force_sample": false,
|
13 |
+
"hidden_act": "silu",
|
14 |
+
"hidden_size": 3584,
|
15 |
+
"image_aspect_ratio": "anyres_max_4",
|
16 |
+
"image_crop_resolution": null,
|
17 |
+
"image_grid_pinpoints": [
|
18 |
+
[
|
19 |
+
384,
|
20 |
+
384
|
21 |
+
],
|
22 |
+
[
|
23 |
+
384,
|
24 |
+
768
|
25 |
+
],
|
26 |
+
[
|
27 |
+
384,
|
28 |
+
1152
|
29 |
+
],
|
30 |
+
[
|
31 |
+
384,
|
32 |
+
1536
|
33 |
+
],
|
34 |
+
[
|
35 |
+
384,
|
36 |
+
1920
|
37 |
+
],
|
38 |
+
[
|
39 |
+
384,
|
40 |
+
2304
|
41 |
+
],
|
42 |
+
[
|
43 |
+
768,
|
44 |
+
384
|
45 |
+
],
|
46 |
+
[
|
47 |
+
768,
|
48 |
+
768
|
49 |
+
],
|
50 |
+
[
|
51 |
+
768,
|
52 |
+
1152
|
53 |
+
],
|
54 |
+
[
|
55 |
+
768,
|
56 |
+
1536
|
57 |
+
],
|
58 |
+
[
|
59 |
+
768,
|
60 |
+
1920
|
61 |
+
],
|
62 |
+
[
|
63 |
+
768,
|
64 |
+
2304
|
65 |
+
],
|
66 |
+
[
|
67 |
+
1152,
|
68 |
+
384
|
69 |
+
],
|
70 |
+
[
|
71 |
+
1152,
|
72 |
+
768
|
73 |
+
],
|
74 |
+
[
|
75 |
+
1152,
|
76 |
+
1152
|
77 |
+
],
|
78 |
+
[
|
79 |
+
1152,
|
80 |
+
1536
|
81 |
+
],
|
82 |
+
[
|
83 |
+
1152,
|
84 |
+
1920
|
85 |
+
],
|
86 |
+
[
|
87 |
+
1152,
|
88 |
+
2304
|
89 |
+
],
|
90 |
+
[
|
91 |
+
1536,
|
92 |
+
384
|
93 |
+
],
|
94 |
+
[
|
95 |
+
1536,
|
96 |
+
768
|
97 |
+
],
|
98 |
+
[
|
99 |
+
1536,
|
100 |
+
1152
|
101 |
+
],
|
102 |
+
[
|
103 |
+
1536,
|
104 |
+
1536
|
105 |
+
],
|
106 |
+
[
|
107 |
+
1536,
|
108 |
+
1920
|
109 |
+
],
|
110 |
+
[
|
111 |
+
1536,
|
112 |
+
2304
|
113 |
+
],
|
114 |
+
[
|
115 |
+
1920,
|
116 |
+
384
|
117 |
+
],
|
118 |
+
[
|
119 |
+
1920,
|
120 |
+
768
|
121 |
+
],
|
122 |
+
[
|
123 |
+
1920,
|
124 |
+
1152
|
125 |
+
],
|
126 |
+
[
|
127 |
+
1920,
|
128 |
+
1536
|
129 |
+
],
|
130 |
+
[
|
131 |
+
1920,
|
132 |
+
1920
|
133 |
+
],
|
134 |
+
[
|
135 |
+
1920,
|
136 |
+
2304
|
137 |
+
],
|
138 |
+
[
|
139 |
+
2304,
|
140 |
+
384
|
141 |
+
],
|
142 |
+
[
|
143 |
+
2304,
|
144 |
+
768
|
145 |
+
],
|
146 |
+
[
|
147 |
+
2304,
|
148 |
+
1152
|
149 |
+
],
|
150 |
+
[
|
151 |
+
2304,
|
152 |
+
1536
|
153 |
+
],
|
154 |
+
[
|
155 |
+
2304,
|
156 |
+
1920
|
157 |
+
],
|
158 |
+
[
|
159 |
+
2304,
|
160 |
+
2304
|
161 |
+
]
|
162 |
+
],
|
163 |
+
"image_split_resolution": null,
|
164 |
+
"initializer_range": 0.02,
|
165 |
+
"intermediate_size": 18944,
|
166 |
+
"max_position_embeddings": 32768,
|
167 |
+
"max_window_layers": 28,
|
168 |
+
"mm_hidden_size": 1152,
|
169 |
+
"mm_newline_position": "grid",
|
170 |
+
"mm_patch_merge_type": "spatial_unpad",
|
171 |
+
"mm_projector_lr": null,
|
172 |
+
"mm_projector_type": "mlp2x_gelu",
|
173 |
+
"mm_resampler_type": null,
|
174 |
+
"mm_spatial_pool_mode": "bilinear",
|
175 |
+
"mm_spatial_pool_stride": null,
|
176 |
+
"mm_tunable_parts": "mm_vision_tower,mm_mlp_adapter,mm_language_model",
|
177 |
+
"mm_use_im_patch_token": false,
|
178 |
+
"mm_use_im_start_end": false,
|
179 |
+
"mm_vision_select_feature": "patch",
|
180 |
+
"mm_vision_select_layer": -2,
|
181 |
+
"mm_vision_tower": "google/siglip-so400m-patch14-384",
|
182 |
+
"mm_vision_tower_lr": 2e-06,
|
183 |
+
"model_type": "qwen2",
|
184 |
+
"num_attention_heads": 28,
|
185 |
+
"num_hidden_layers": 28,
|
186 |
+
"num_key_value_heads": 4,
|
187 |
+
"pos_skipping_range": 4096,
|
188 |
+
"rms_norm_eps": 1e-06,
|
189 |
+
"rope_scaling": null,
|
190 |
+
"rope_theta": 1000000.0,
|
191 |
+
"sliding_window": 131072,
|
192 |
+
"tie_word_embeddings": false,
|
193 |
+
"tokenizer_model_max_length": 8192,
|
194 |
+
"tokenizer_padding_side": "right",
|
195 |
+
"torch_dtype": "bfloat16",
|
196 |
+
"transformers_version": "4.40.0.dev0",
|
197 |
+
"use_cache": false,
|
198 |
+
"use_mm_proj": true,
|
199 |
+
"use_pos_skipping": false,
|
200 |
+
"use_sliding_window": false,
|
201 |
+
"vision_tower_pretrained": null,
|
202 |
+
"vocab_size": 152064
|
203 |
+
}
|
checkpoint-6000/generation_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"temperature": 0.7,
|
11 |
+
"top_k": 20,
|
12 |
+
"top_p": 0.8,
|
13 |
+
"transformers_version": "4.40.0.dev0"
|
14 |
+
}
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:220d6d227d49cc60f6c084233de373ce62e5862feaa70f3534abfa08a45997c2
|
3 |
+
size 1505698422
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bdadc58b2695c52f49ce48349c0aedde52d95e2d7a8bc4c47af10d83ce7539a
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d0c009adccbd2f2cac6b3574ca64b981088c308f752ea0ec22a6599c7905fe0
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b7cb665ea94081b53575f75ec91fb57e72da2bc604ada1b377e0c5f08bba6d0
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfdfa161e7d1d814beaf207934f452b9c70bc238eb6239ea8eecca71ad0da205
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2181c07cf741f92a78a07a8ef2b5a08ad502c13782630c9b05f28f9935bf9609
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5d932c9148df0e5732add8bebb4cbf8952e5229b34598e58cc525b14b778944
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be5fee9ec99dbdb146e1f263b9ff61b834f928c975953670776d9dd3a9aca071
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0053ab54932d3deb83de39e6ed82e21efcb9e2e871e7e034e595fa2e6ea2aee3
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d508f74650be933a0dcf4be0bc496dbaf60abb40b8155aea5335176204a64322
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eadc85b97c17aa72b145dfc77f8f6fd6aecac8fec1e9ae1ca42c5cc1ba2f4635
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c52597edfd7605b2b79197738e16cc3d6b96e4e02f04562010dcb2709743dd4e
|
3 |
+
size 1505698422
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4c156223b61fa907b619c59c98e59308d5212a3ffb7f8e41fc67a5599acdd5f
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fd30f1afb47d6f7ab058d68777237f1978dbae8da4254cd4bcdebd435319a69
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e23a53e83005d949088d6507a59f9d40ab32206fe9573129d3088d9f9d39346
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:101b50138890da67900be4ccea58ece98fb1891f36da1b9620def35a8c392168
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a4de862ca032ebc2cd430714406dcfdc4af07bb1d4c5a86e841f97b209fa1f2
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7453205b3376ccea183c191cdafbd2141dd1b8f3c67a93fd0ce7fc411211f7b7
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a260fcff10a546756333e412813f9cbdd20ad9eb29b24364495dfbd41c30ad39
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:121aef84150c1440104acd0dd6fb6ce92491b31bf7d608ea526f2cf1a433e2bd
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e4cece71ac3932d906f6e0e7f977c95590cb7e39aeb4aa3a2f5a9f3ac7caaba
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:140d80410049b0f7ec3382c2c9acfb0cd7d0c579301ed5c654b542a6568731e4
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0be87612d6ad284a5ee5f4365fc0d8b6cdd747dc36d6ad0d7f16b07560be99a2
|
3 |
+
size 1505698422
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6b21c05011d81d216b0d1c64855ea971873c43e59aeea7127996d935c0bc43a
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c64d4e4ac013a019ed48da9f717d72d5908078ab2efe485106bff5c61e5ff677
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e05c517cc4628eb35fe140843cb4167fbb68847bbaae16a8dbd82388bc5fc483
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a684471d7a4d0e7dc729dc9bf55ad74b37d91f52827130168d18872ea0148cf7
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31e52cb36d23ffeed397305553a386c4507b9c7d34c842f671e27522aa2b0464
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2ba7e7fc6a5fc2f25588e3e75a2defe4ecf813184d610125b4c0bc1550e7e7e
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afbbc824f1724dd78ab57d02c41a72ec0b8c992253f5d8fb1a3f46936709b036
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da3c6aa0f5d63223da62b6fc93e93d8382b5c348bd9e98decc4b3d1a85cb308d
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7e491992f43d2014faff938eb9a7e571760c4e3a97317b3555864dda899dc31
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cbdc0f8edf0ef96b3ff075e620123cd31c5848a3db35ba994245e668eb0c391
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3830403340313eebdfd0f3b23cb5ce42b464e886103b4d556012faba1cba9f1
|
3 |
+
size 1505698422
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b35beca21e2c3fc597d89109a4d18beb0a13984cb88fa3ad15ec9c9feb5e42bc
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e2548854f30c286b93f1298e232dce50cfade20fb71cbec60cf6170af16bc7c
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5d165ebeb38e7558b92b8be7d7202c300c17d6b96dbe9dfbdcd8acb75722e48
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c92035cd2cfef2c04d82e5c9b1f7e07abcc4d61756d6b3f7b2345e593c69921
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b247c5077dc11cd851caa8c1d4be1dac99551f40f227cf6c390b25fc13efc965
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8439b389bbd4562dee142eccdec82763b1af80ff4b89241c585588fe0479ac6c
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19d8ff7be157a55112e6f1ae934f84655b91015f11d21f65019b890dc60630d4
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d120195e414743f6baf970ca64e1df04064a378fc8c9d3ae6bbbca5d557ad4
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ea834ac90068533e51dbf52bf4667bb1bb8e336db9ce27aa192849d82d04c06
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62fd49c90a850c7d4aca67a8be8dea825cc9db216e32dea5512ec9e58a58d9f6
|
3 |
+
size 1505698442
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db04bafd2453652599354e454a3d044e0f6ca49b0c464a09b9b7c43a9597480f
|
3 |
+
size 1505698422
|
checkpoint-6000/global_step6000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd78325cf51026cbad98158bdbd9f12ab40817fbedb8c9f4c4f554bd0b840902
|
3 |
+
size 1505698442
|