jiachenl commited on
Commit
e71f1e5
1 Parent(s): 05546d7
Files changed (33) hide show
  1. .gitattributes +32 -0
  2. cumo-mixtral-8x7b/pft_stage/clip.bin +3 -0
  3. cumo-mixtral-8x7b/pft_stage/config.json +3 -0
  4. cumo-mixtral-8x7b/pft_stage/generation_config.json +3 -0
  5. cumo-mixtral-8x7b/pft_stage/mm_projector.bin +3 -0
  6. cumo-mixtral-8x7b/pft_stage/model-00001-of-00019.safetensors +3 -0
  7. cumo-mixtral-8x7b/pft_stage/model-00002-of-00019.safetensors +3 -0
  8. cumo-mixtral-8x7b/pft_stage/model-00003-of-00019.safetensors +3 -0
  9. cumo-mixtral-8x7b/pft_stage/model-00004-of-00019.safetensors +3 -0
  10. cumo-mixtral-8x7b/pft_stage/model-00005-of-00019.safetensors +3 -0
  11. cumo-mixtral-8x7b/pft_stage/model-00006-of-00019.safetensors +3 -0
  12. cumo-mixtral-8x7b/pft_stage/model-00007-of-00019.safetensors +3 -0
  13. cumo-mixtral-8x7b/pft_stage/model-00008-of-00019.safetensors +3 -0
  14. cumo-mixtral-8x7b/pft_stage/model-00009-of-00019.safetensors +3 -0
  15. cumo-mixtral-8x7b/pft_stage/model-00010-of-00019.safetensors +3 -0
  16. cumo-mixtral-8x7b/pft_stage/model-00011-of-00019.safetensors +3 -0
  17. cumo-mixtral-8x7b/pft_stage/model-00012-of-00019.safetensors +3 -0
  18. cumo-mixtral-8x7b/pft_stage/model-00013-of-00019.safetensors +3 -0
  19. cumo-mixtral-8x7b/pft_stage/model-00014-of-00019.safetensors +3 -0
  20. cumo-mixtral-8x7b/pft_stage/model-00015-of-00019.safetensors +3 -0
  21. cumo-mixtral-8x7b/pft_stage/model-00016-of-00019.safetensors +3 -0
  22. cumo-mixtral-8x7b/pft_stage/model-00017-of-00019.safetensors +3 -0
  23. cumo-mixtral-8x7b/pft_stage/model-00018-of-00019.safetensors +3 -0
  24. cumo-mixtral-8x7b/pft_stage/model-00019-of-00019.safetensors +3 -0
  25. cumo-mixtral-8x7b/pft_stage/model.safetensors.index.json +3 -0
  26. cumo-mixtral-8x7b/pft_stage/special_tokens_map.json +3 -0
  27. cumo-mixtral-8x7b/pft_stage/tokenizer.model +3 -0
  28. cumo-mixtral-8x7b/pft_stage/tokenizer_config.json +3 -0
  29. cumo-mixtral-8x7b/pft_stage/trainer_state.json +3 -0
  30. cumo-mixtral-8x7b/pft_stage/training_args.bin +3 -0
  31. cumo-mixtral-8x7b/pretrain_stage/config.json +3 -0
  32. cumo-mixtral-8x7b/pretrain_stage/mm_projector.bin +3 -0
  33. cumo-mixtral-8x7b/pretrain_stage/trainer_state.json +3 -0
.gitattributes CHANGED
@@ -51,3 +51,35 @@ cumo-mistral-7b/pft_stage/config.json filter=lfs diff=lfs merge=lfs -text
51
  cumo-mistral-7b/pft_stage/generation_config.json filter=lfs diff=lfs merge=lfs -text
52
  cumo-mistral-7b/pft_stage/model-00003-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text
53
  cumo-mistral-7b/pft_stage/special_tokens_map.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  cumo-mistral-7b/pft_stage/generation_config.json filter=lfs diff=lfs merge=lfs -text
52
  cumo-mistral-7b/pft_stage/model-00003-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text
53
  cumo-mistral-7b/pft_stage/special_tokens_map.json filter=lfs diff=lfs merge=lfs -text
54
+ cumo-mixtral-8x7b/pretrain_stage/config.json filter=lfs diff=lfs merge=lfs -text
55
+ cumo-mixtral-8x7b/pretrain_stage/mm_projector.bin filter=lfs diff=lfs merge=lfs -text
56
+ cumo-mixtral-8x7b/pretrain_stage/trainer_state.json filter=lfs diff=lfs merge=lfs -text
57
+ cumo-mixtral-8x7b/pft_stage/model-00018-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
58
+ cumo-mixtral-8x7b/pft_stage/generation_config.json filter=lfs diff=lfs merge=lfs -text
59
+ cumo-mixtral-8x7b/pft_stage/model-00011-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
60
+ cumo-mixtral-8x7b/pft_stage/model-00014-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
61
+ cumo-mixtral-8x7b/pft_stage/training_args.bin filter=lfs diff=lfs merge=lfs -text
62
+ cumo-mixtral-8x7b/pft_stage/model-00007-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
63
+ cumo-mixtral-8x7b/pft_stage/model-00012-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
64
+ cumo-mixtral-8x7b/pft_stage/model-00016-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
65
+ cumo-mixtral-8x7b/pft_stage/model.safetensors.index.json filter=lfs diff=lfs merge=lfs -text
66
+ cumo-mixtral-8x7b/pft_stage/special_tokens_map.json filter=lfs diff=lfs merge=lfs -text
67
+ cumo-mixtral-8x7b/pft_stage/model-00004-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
68
+ cumo-mixtral-8x7b/pft_stage/model-00008-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
69
+ cumo-mixtral-8x7b/pft_stage/model-00010-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
70
+ cumo-mixtral-8x7b/pft_stage/model-00006-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
71
+ cumo-mixtral-8x7b/pft_stage/model-00009-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
72
+ cumo-mixtral-8x7b/pft_stage/tokenizer.model filter=lfs diff=lfs merge=lfs -text
73
+ cumo-mixtral-8x7b/pft_stage/clip.bin filter=lfs diff=lfs merge=lfs -text
74
+ cumo-mixtral-8x7b/pft_stage/model-00001-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
75
+ cumo-mixtral-8x7b/pft_stage/model-00005-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
76
+ cumo-mixtral-8x7b/pft_stage/model-00013-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
77
+ cumo-mixtral-8x7b/pft_stage/model-00019-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
78
+ cumo-mixtral-8x7b/pft_stage/model-00017-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
79
+ cumo-mixtral-8x7b/pft_stage/config.json filter=lfs diff=lfs merge=lfs -text
80
+ cumo-mixtral-8x7b/pft_stage/mm_projector.bin filter=lfs diff=lfs merge=lfs -text
81
+ cumo-mixtral-8x7b/pft_stage/model-00002-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
82
+ cumo-mixtral-8x7b/pft_stage/trainer_state.json filter=lfs diff=lfs merge=lfs -text
83
+ cumo-mixtral-8x7b/pft_stage/model-00003-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
84
+ cumo-mixtral-8x7b/pft_stage/model-00015-of-00019.safetensors filter=lfs diff=lfs merge=lfs -text
85
+ cumo-mixtral-8x7b/pft_stage/tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
cumo-mixtral-8x7b/pft_stage/clip.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:611cb25503ba855083647abee8ff613234ebb474e41360c59ffebe9117a6019b
3
+ size 1214122445
cumo-mixtral-8x7b/pft_stage/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e83d1408c37ec73ba2c563e2dfbb280d773af76683a5a71d714abb2d72b6998e
3
+ size 1549
cumo-mixtral-8x7b/pft_stage/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e39d2130d0ad1e0663c1500e3e949848063444c146777aa0261a350e75b51ed7
3
+ size 132
cumo-mixtral-8x7b/pft_stage/mm_projector.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac20397ec3cd2b21d048cba3fb16a7172a16338ddff7cf7ad9f10f73f5f7192
3
+ size 100698168
cumo-mixtral-8x7b/pft_stage/model-00001-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da4324369397216e08c5e23de62e01508c10a00e121ebd70fd4f557973756978
3
+ size 4892809584
cumo-mixtral-8x7b/pft_stage/model-00002-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42531d55c481ab12ccbe3340b899f81528acc9bf27e45e92f8a7a4a7cfdb3e77
3
+ size 4983004016
cumo-mixtral-8x7b/pft_stage/model-00003-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4910740948899a8a9cc73d2b68087f795b463e2c718c6995ca1b249c39c9f2d8
3
+ size 4983004016
cumo-mixtral-8x7b/pft_stage/model-00004-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69798d9aba04ee5dbb657fd531055e06b4d65409b6c44abe0b1dad06616f9ee6
3
+ size 4899035200
cumo-mixtral-8x7b/pft_stage/model-00005-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfd9e097edfc233f6501bb3bb0f296b0a798af7c641bf8420957f9e06f5e760b
3
+ size 4983004016
cumo-mixtral-8x7b/pft_stage/model-00006-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79f95754cf342b80301a9e123d77f3d36b734b0e3dba506cdbf453a44c21093b
3
+ size 4983004016
cumo-mixtral-8x7b/pft_stage/model-00007-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:022b78e679d0018a486f3b2247eba5d522776503d269e6047abe68eb41a13961
3
+ size 4899035248
cumo-mixtral-8x7b/pft_stage/model-00008-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf1625b9c3d70823243692579df555271b231c00cc1e0862357257007f6a748d
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00009-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f588d4346d4cbfec810cef01aa9179ff9846b999d7c4ea1a4e023305fc3afbc5
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00010-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:640555745d5c408a86387c39bbcbba28f328f748c48f30ca4a8e7730888d3c4f
3
+ size 4899035248
cumo-mixtral-8x7b/pft_stage/model-00011-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cbf76ac80c45bb7c006d0b69232c991db66fb6569e5af4251b2bcb9197560ef
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00012-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc81e1beef9a8c73a4a91b66388276e1c4897b34dfe7644d115fc81496bf18a0
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00013-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce59423afffa39c24453e5ae8f74eabf649aac6a251067768db96f0ca805774
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00014-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb30ddc4b0ba8e39d33a30e3424d8cd060a168dbf7703b16c8208132cc9f0aec
3
+ size 4899035248
cumo-mixtral-8x7b/pft_stage/model-00015-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:810a66a764e5b78ebdfdb7d00762f0280335b18643228c680dc6a0145ed88e33
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00016-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a28d31a22892f25c8d1f9f751421db28f5366e6769938892adb7c1aa75d38fc5
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00017-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03f0e07b28d967b40f25014e57e4da06aaa53545f59235fd5fe0537a54a59305
3
+ size 4899035248
cumo-mixtral-8x7b/pft_stage/model-00018-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d37aba6ed443104edb19640cfa30955d8444cfae2d19ce7bb70d454eb0a340e4
3
+ size 4983004072
cumo-mixtral-8x7b/pft_stage/model-00019-of-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6739453c10f6eb2db607bedb01814c64d76f361182b3406cc1ca33679d2d061
3
+ size 4879094400
cumo-mixtral-8x7b/pft_stage/model.safetensors.index.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87016246ffe4cf21d4073e49b96c9be022633897f4f5b09770301d9006084253
3
+ size 136585
cumo-mixtral-8x7b/pft_stage/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:719833ff26ac897a3ec8ed946028a135de2a351470af59b4008744ab1f0ee9b7
3
+ size 438
cumo-mixtral-8x7b/pft_stage/tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
cumo-mixtral-8x7b/pft_stage/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b517c3b2f923eb93532c182caf3db29e4dd163fae5d907a7763e6eb1050a5b6a
3
+ size 1463
cumo-mixtral-8x7b/pft_stage/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd88a936dbb79c438eb5a096ddc492d61bd3d71912cc5c018d812fbacc184440
3
+ size 670447
cumo-mixtral-8x7b/pft_stage/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e09ee22a52bdef6688e0d40b481f762d67db742ccd1d957e3200e5a4c92779a4
3
+ size 7608
cumo-mixtral-8x7b/pretrain_stage/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3879a84a4ffba9768eab98a78690a0242b54a97ff9c3c20455a61cea89de1c4
3
+ size 1546
cumo-mixtral-8x7b/pretrain_stage/mm_projector.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:920e94f89ada6b88d7b402ed0859d92d8d902837621088a9a1f75384014553d1
3
+ size 50350136
cumo-mixtral-8x7b/pretrain_stage/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:872dc5bb233ddb022208aa92655ce118ce6c6f5a4ff6c7f4f81f4392cc008ffd
3
+ size 263241