Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- added_tokens.json +16 -0
- all_results.json +8 -0
- chat_template.json +3 -0
- checkpoint-3089/added_tokens.json +16 -0
- checkpoint-3089/chat_template.json +3 -0
- checkpoint-3089/config.json +48 -0
- checkpoint-3089/generation_config.json +13 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_4_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_5_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_6_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_7_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_8_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_9_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/latest +1 -0
- checkpoint-3089/merges.txt +0 -0
- checkpoint-3089/model-00001-of-00031.safetensors +3 -0
- checkpoint-3089/model-00002-of-00031.safetensors +3 -0
- checkpoint-3089/model-00003-of-00031.safetensors +3 -0
- checkpoint-3089/model-00004-of-00031.safetensors +3 -0
- checkpoint-3089/model-00005-of-00031.safetensors +3 -0
- checkpoint-3089/model-00006-of-00031.safetensors +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|box_end|>": 151649,
|
3 |
+
"<|box_start|>": 151648,
|
4 |
+
"<|endoftext|>": 151643,
|
5 |
+
"<|im_end|>": 151645,
|
6 |
+
"<|im_start|>": 151644,
|
7 |
+
"<|image_pad|>": 151655,
|
8 |
+
"<|object_ref_end|>": 151647,
|
9 |
+
"<|object_ref_start|>": 151646,
|
10 |
+
"<|quad_end|>": 151651,
|
11 |
+
"<|quad_start|>": 151650,
|
12 |
+
"<|video_pad|>": 151656,
|
13 |
+
"<|vision_end|>": 151653,
|
14 |
+
"<|vision_pad|>": 151654,
|
15 |
+
"<|vision_start|>": 151652
|
16 |
+
}
|
all_results.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 1.0,
|
3 |
+
"total_flos": 3876169351954432.0,
|
4 |
+
"train_loss": 0.8143089480599218,
|
5 |
+
"train_runtime": 151234.6723,
|
6 |
+
"train_samples_per_second": 2.614,
|
7 |
+
"train_steps_per_second": 0.02
|
8 |
+
}
|
chat_template.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
|
3 |
+
}
|
checkpoint-3089/added_tokens.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|box_end|>": 151649,
|
3 |
+
"<|box_start|>": 151648,
|
4 |
+
"<|endoftext|>": 151643,
|
5 |
+
"<|im_end|>": 151645,
|
6 |
+
"<|im_start|>": 151644,
|
7 |
+
"<|image_pad|>": 151655,
|
8 |
+
"<|object_ref_end|>": 151647,
|
9 |
+
"<|object_ref_start|>": 151646,
|
10 |
+
"<|quad_end|>": 151651,
|
11 |
+
"<|quad_start|>": 151650,
|
12 |
+
"<|video_pad|>": 151656,
|
13 |
+
"<|vision_end|>": 151653,
|
14 |
+
"<|vision_pad|>": 151654,
|
15 |
+
"<|vision_start|>": 151652
|
16 |
+
}
|
checkpoint-3089/chat_template.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
|
3 |
+
}
|
checkpoint-3089/config.json
ADDED
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/mnt/zhangh/sicong/vl3_data/checkpoints/Qwen/Qwen2-VL-72B-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"Qwen2VLForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"eos_token_id": 151645,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 8192,
|
11 |
+
"image_token_id": 151655,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 29568,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"max_window_layers": 80,
|
16 |
+
"model_type": "qwen2_vl",
|
17 |
+
"num_attention_heads": 64,
|
18 |
+
"num_hidden_layers": 80,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"rms_norm_eps": 1e-06,
|
21 |
+
"rope_scaling": {
|
22 |
+
"mrope_section": [
|
23 |
+
16,
|
24 |
+
24,
|
25 |
+
24
|
26 |
+
],
|
27 |
+
"rope_type": "default",
|
28 |
+
"type": "default"
|
29 |
+
},
|
30 |
+
"rope_theta": 1000000.0,
|
31 |
+
"sliding_window": 32768,
|
32 |
+
"tie_word_embeddings": false,
|
33 |
+
"torch_dtype": "bfloat16",
|
34 |
+
"transformers_version": "4.46.0",
|
35 |
+
"use_cache": false,
|
36 |
+
"use_sliding_window": false,
|
37 |
+
"video_token_id": 151656,
|
38 |
+
"vision_config": {
|
39 |
+
"hidden_size": 8192,
|
40 |
+
"in_chans": 3,
|
41 |
+
"model_type": "qwen2_vl",
|
42 |
+
"spatial_patch_size": 14
|
43 |
+
},
|
44 |
+
"vision_end_token_id": 151653,
|
45 |
+
"vision_start_token_id": 151652,
|
46 |
+
"vision_token_id": 151654,
|
47 |
+
"vocab_size": 152064
|
48 |
+
}
|
checkpoint-3089/generation_config.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"top_k": 1,
|
11 |
+
"top_p": 0.001,
|
12 |
+
"transformers_version": "4.46.0"
|
13 |
+
}
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e9af1bdd887a1da4b3a35821b9c173ad288d30d6bb27169f9c389484f75ec90
|
3 |
+
size 27264832986
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0549f952cf6f55d73bd5593e80f1153ef9f97516270a218b09e18020cee7220c
|
3 |
+
size 27264832986
|
checkpoint-3089/global_step3089/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e41434a5ad731a78a8dad2b1ef56d4d1cb8e41fca57d3e782e00822b3fb2621
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_10_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91ad25e50e28a70dd80e67648f833b84b88b8baf0f27c478fd14cb34e7489905
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_11_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c049a00ebf7e1e30fbeb2c4b6d6da7bd69cf27459b7886b7aafd75aea3f301b
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_12_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33f8c19548fae28f04bf6d71a44c3bbee777173465e1208c48ed4d75665f1106
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_13_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:965f500adc9dc48d10e97f0cd1f6c82eb16b2cdb1dd6174484475175406265d3
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_14_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ada2cbfa52a5681bbfd03b7215e0f7e2840a12a039fcac4e3eabd9d63c1c40c
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_15_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c882f6a86a3bebf481a99fef4f3eefcf7c1e692f7b9405268c3735dccbe5f8d2
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_16_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76ef144674ef9452e04a1175468dcf6d9305b0e61564788bbe87da7cc3c2888c
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_17_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:223d7ab37dbba4a4b14873b2fe86dec125bd8fd9e265620942831da2915fb994
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_18_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01c97513b431c66edbe12d2a70006952368038c67fc2cb272900e6d0e66b9709
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_19_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e5120dcc9bf408d6ca670be98e16670574b1ac931d7ee4fd4aae9ed8d316aa0
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46a67ce8ae0efcc851dfb916eed74e99a33f3d3f70a1248549b5f4119eadc907
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_20_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd189deeee01907e169f047d7eead0ed03b473722e88fbeb16aa2a81becafea1
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_21_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbe70438be54b97ce124c0002c8dbfc5819a99df7f819a8fa8609d3ecc7954b7
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_22_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ec1550f4a8bca06d9b3f45ac9d2954e093260e4a9c126eea126c5d7d98ba04
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_23_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:add5a9277b6d6272ad6c9f7a2b92d33cc0b558aca26fdfc00869d81f38e12c4f
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_24_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e4de61fde067204c4b1fd75c14baac50576b32b0c70403cdf8b150d53e25304
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_25_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1c06aa5093120584a1efed49d1e45bc5054476c945f54e5c2ccd9f75a7d11d1
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_26_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4605ae8b1913f100eb953def115012e0612a9eca6e19f7d1a425262a84313477
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_27_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1996d756bf4976e4bf688a8f13a6ceb8e1bb9f89b447eded990ae372ef54b4b1
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_28_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64b7a06abcddc4c3af4a0d3aa86bd0be13b2320587dc7a868a176dfc8d93eb5b
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_29_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34a62b2e4e0178139b92da488ed9f08ad4c3db98eb19586599340562af8a33fc
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbfcfff5dd0ea8985741ec5dc10efd4849babff293148f29d6c4962dfe31f3f1
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_30_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84f446e13e565029ee5a6c917cfea46acc17128c270d4603a496504c52c541c6
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_31_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0edacd886404b1ec1847ff0f1fa276de3c712cd80d92d8b8199c16ef5484595f
|
3 |
+
size 44481433
|
checkpoint-3089/global_step3089/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef52638e3827b7f3c5c2eed9001269e03c337c780988d905a8830734587117d2
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_4_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2521dee64bae1393a9d70aec44f82a261302f907ace41e785081036c9e4c3e6c
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_5_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a89df309ddc9916c596386daf668786315c6fc124d5045467aab5f9618a77a8
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_6_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6a495a92d5551d5d5c4a0b8e51b4ac6e0fee89e5788d90948b66bce8c0ab14c
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_7_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63d0db21fcd77d865910e86142b2ec7bb949d9cce83117c164900a97de0b28b3
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_8_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47fceef47d85c46b79db9195110086d58c47ee466661067bc16d9b40fe026305
|
3 |
+
size 44479684
|
checkpoint-3089/global_step3089/zero_pp_rank_9_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2ad852d3fe75b8bd0e1a811e0462c18fac478bcf0075b6ef7b013ce3604b617
|
3 |
+
size 44479684
|
checkpoint-3089/latest
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
global_step3089
|
checkpoint-3089/merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
checkpoint-3089/model-00001-of-00031.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a35db42a610fa0177bed31f85747ea9c6753f50e424c5a2033fc0bbb5531c8d
|
3 |
+
size 4676624560
|
checkpoint-3089/model-00002-of-00031.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d75f14db98499d917166ea549a2590fda0ef8646303d87009f5a6f3385b865e3
|
3 |
+
size 4781670320
|
checkpoint-3089/model-00003-of-00031.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e02cf6ba2f44a0b8ec9921255d7ab0b7b7b7cb62c186ca5d9074aac0eba45362
|
3 |
+
size 4964101384
|
checkpoint-3089/model-00004-of-00031.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42b5dc8de56dcf15b7f46c058cda975edd3a0d3595563c815bfe515ca77987af
|
3 |
+
size 4781637328
|
checkpoint-3089/model-00005-of-00031.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:200b6d5d9230fd0de547eb1ae87210faf45fc35a6793bad03d4b19222c408b87
|
3 |
+
size 4781670344
|
checkpoint-3089/model-00006-of-00031.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57e65e1295c4f183300eaeda92bd9b8c1544898cbb3fb9eb5ca021e4d2b99019
|
3 |
+
size 4781670360
|