upload model
Browse files- .gitattributes +20 -0
- added_tokens.json +3 -0
- chat_template.jinja +3 -0
- config.json +3 -0
- generation_config.json +3 -0
- global_step45500/.gitattributes +8 -0
- global_step45500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- global_step45500/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- global_step45500/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- global_step45500/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- global_step45500/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- global_step45500/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- global_step45500/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- global_step45500/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- latest +3 -0
- merges.txt +3 -0
- rng_state_0.pth +3 -0
- rng_state_1.pth +3 -0
- rng_state_2.pth +3 -0
- rng_state_3.pth +3 -0
- scheduler.pt +3 -0
- special_tokens_map.json +3 -0
- tokenizer_config.json +3 -0
- trainer_state.json +3 -0
- training_args.bin +3 -0
- vocab.json +3 -0
- zero_to_fp32.py +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,23 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
special_tokens_map.json filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
vocab.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
added_tokens.json filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
config.json filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
generation_config.json filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
*.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
scheduler.pt filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
rng_state_0.pth filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
rng_state_2.pth filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
rng_state_3.pth filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
zero_to_fp32.py filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
global_step45500 filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
latest filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
merges.txt filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
rng_state_1.pth filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
training_args.bin filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
chat_template.jinja filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
.pth filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b
|
| 3 |
+
size 605
|
chat_template.jinja
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd8e9439f0570856fd70470bf8889ebd8b5d1107207f67a5efb46e342330527f
|
| 3 |
+
size 2507
|
config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebeb2c8c5b579645b34f43a9192d77e869763cc4a71f16515a0d6661b6a6fc6e
|
| 3 |
+
size 1325
|
generation_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69dbae630519cf998049cce7936711f8a33ae1cc0f0859c81a1e8ad0eec58fcc
|
| 3 |
+
size 242
|
global_step45500/.gitattributes
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
zero_pp_rank_2_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
zero_pp_rank_3_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
zero_pp_rank_0_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
zero_pp_rank_1_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
global_step45500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39107ef2a1b29e683d76017e80e3b9e3332162769c82e0b4d539d5195c963b5f
|
| 3 |
+
size 22846856147
|
global_step45500/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b172e8f04d0ebc51d9b3ea7c3edc9be4a63ef1993f78bc4ee637d972f62de211
|
| 3 |
+
size 22846856147
|
global_step45500/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92ca3daa732047e77797f3308d87f6175d2ed967fe63c98a648a43c463840b04
|
| 3 |
+
size 22846856147
|
global_step45500/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7204ed2655b8bede36dbc51780e5806729ed5b651a0abac3805f7c98c6878186
|
| 3 |
+
size 22846856147
|
global_step45500/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:356ca5c65924b0cc0a37dea0a442bea30970e94b22091234c3777aec29309259
|
| 3 |
+
size 174112
|
global_step45500/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe8213d2057e928009c30d60313ddbe36914f491a3c4cb9fb72d00b375cbd8a6
|
| 3 |
+
size 174112
|
global_step45500/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fea6f2020c6a62a475008136f0831b9d8c044ca3f2e54598ec19635d261039f4
|
| 3 |
+
size 174112
|
global_step45500/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b3e98dcc94f9f973ed0e25e6cd2ea9f8ebe581ba45bb7123ccd3e8096367b12
|
| 3 |
+
size 174112
|
latest
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88c3e5d99756c35b50f23a6674c82d5c9eacade908c5e6efbf5c0621dd7db10a
|
| 3 |
+
size 16
|
merges.txt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5
|
| 3 |
+
size 1671853
|
rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fe6b873f1da64bb980afe982fc1c6b6bc461ad8c33073d856804323f64b26d9
|
| 3 |
+
size 15429
|
rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13db4dd10b22b5464f5ef0b539152b46390eae6a827b355108cb54b1af2eb830
|
| 3 |
+
size 15429
|
rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06e293f13fb6e873e8081636b6b07115410b397c55f1ed08b8772b059c8eb74e
|
| 3 |
+
size 15429
|
rng_state_3.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c595c077664f94b7f91088561951be20e39483e01865774a83bc46f3971a3152
|
| 3 |
+
size 15429
|
scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:551f0698a3346a2138b76f80a9272e2c29faeeb78ac0d8c61e514deecb1ca24e
|
| 3 |
+
size 1401
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd
|
| 3 |
+
size 613
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f06d54777a4c59c23ed608b2529c49f6a66853df9bc8a254d52eeb3b99d7c827
|
| 3 |
+
size 4712
|
trainer_state.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2fa393e5fba106833b340abd9bd86cb1a6d5e5685eec3e8c95190d90234f0b9
|
| 3 |
+
size 796227
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11fb0cbfa791291738d24f59d23d3534f04fa18f29ce10cfe8703797019a5d38
|
| 3 |
+
size 6161
|
vocab.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87a257b04b17642a0688c98cd1df89c398bda4fee532d6f88b38a659ecb4ac8d
|
| 3 |
+
size 3383407
|
zero_to_fp32.py
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46497565ccf2b4a8b1f6f18c8341042f3749605a94335c81f69df1bd268af64f
|
| 3 |
+
size 33272
|