VictorSanh committed on
Commit
c604e0f
1 Parent(s): fd643bd

End of training

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +9 -5
  2. adapter_config.json +12 -1
  3. adapter_model.safetensors +2 -2
  4. global_step1851/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  5. global_step1851/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step1851/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  7. global_step1851/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  8. global_step1851/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  9. global_step1851/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  10. global_step1851/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  11. global_step1851/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  12. global_step1851/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  13. global_step1851/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  14. global_step1851/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  15. global_step1851/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  16. global_step1851/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  17. global_step1851/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  18. global_step1851/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  19. global_step1851/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  20. global_step1851/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  21. global_step1851/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  22. global_step1851/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  23. global_step1851/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  24. global_step1851/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  25. global_step1851/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  26. global_step1851/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  27. global_step1851/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  28. global_step1851/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
  29. global_step1851/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  30. global_step1851/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
  31. global_step1851/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +3 -0
  32. global_step1851/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +3 -0
  33. global_step1851/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +3 -0
  34. global_step1851/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt +3 -0
  35. global_step1851/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt +3 -0
  36. global_step1851/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  37. global_step1851/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  38. global_step1851/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  39. global_step1851/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  40. global_step1851/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  41. global_step1851/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  42. global_step1851/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  43. global_step1851/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  44. global_step1851/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  45. global_step1851/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  46. global_step1851/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  47. global_step1851/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  48. global_step1851/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  49. global_step1851/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  50. global_step1851/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
README.md CHANGED
@@ -33,14 +33,18 @@ More information needed
33
  ### Training hyperparameters
34
 
35
  The following hyperparameters were used during training:
36
- - learning_rate: 0.001
37
  - train_batch_size: 2
38
  - eval_batch_size: 8
39
  - seed: 42
 
 
 
 
40
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
41
  - lr_scheduler_type: linear
42
- - lr_scheduler_warmup_steps: 1
43
- - num_epochs: 1
44
 
45
  ### Training results
46
 
@@ -48,8 +52,8 @@ The following hyperparameters were used during training:
48
 
49
  ### Framework versions
50
 
51
- - PEFT 0.9.0
52
  - Transformers 4.41.0.dev0
53
- - Pytorch 2.1.2+cu118
54
  - Datasets 2.14.7
55
  - Tokenizers 0.19.1
 
33
  ### Training hyperparameters
34
 
35
  The following hyperparameters were used during training:
36
+ - learning_rate: 0.0001
37
  - train_batch_size: 2
38
  - eval_batch_size: 8
39
  - seed: 42
40
+ - distributed_type: multi-GPU
41
+ - num_devices: 32
42
+ - total_train_batch_size: 64
43
+ - total_eval_batch_size: 256
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: linear
46
+ - lr_scheduler_warmup_steps: 150
47
+ - num_epochs: 3
48
 
49
  ### Training results
50
 
 
52
 
53
  ### Framework versions
54
 
55
+ - PEFT 0.8.2
56
  - Transformers 4.41.0.dev0
57
+ - Pytorch 2.0.1+cu118
58
  - Datasets 2.14.7
59
  - Tokenizers 0.19.1
adapter_config.json CHANGED
@@ -21,7 +21,18 @@
21
  "r": 8,
22
  "rank_pattern": {},
23
  "revision": null,
24
- "target_modules": ".*(vision_model|modality_projection).*(down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj|out_proj|fc1|fc2).*$",
 
 
 
 
 
 
 
 
 
 
 
25
  "task_type": null,
26
  "use_dora": true,
27
  "use_rslora": false
 
21
  "r": 8,
22
  "rank_pattern": {},
23
  "revision": null,
24
+ "target_modules": [
25
+ "fc1",
26
+ "down_proj",
27
+ "v_proj",
28
+ "fc2",
29
+ "q_proj",
30
+ "gate_proj",
31
+ "up_proj",
32
+ "k_proj",
33
+ "out_proj",
34
+ "o_proj"
35
+ ],
36
  "task_type": null,
37
  "use_dora": true,
38
  "use_rslora": false
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52d837bec138c69794cc2273939e86b8800ad8ca8894ea91f4b467fd888f06ba
3
- size 10170512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e44ce263e6fd885f50d82ca515b9325375b43ee36ededb75acf161ce88bc2e41
3
+ size 48
global_step1851/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:025b1cd5afbca8d38f5c47b3cfa0228d14de98d80bf3d7dd5e7eb3792c25f2bd
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d952918d209940accbb6b6760be3aeaff64ea5f48b9013ce3b02dc088eae41f
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b48e6c001144fecc9cf24d6c0234aaa8f57cbb6546fb301452e3183a44c3641
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f41afe7b754464fa6f66f38795a12471f2e8797aec0226deb2f58be8b5bf83d2
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f19db86359349ad86ed7bc9fa2ac6785d527c213c5060d30573aa725a60f3c08
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5270cb7c4b931ba77e4ae3179412d47b28d319b4c9e3007368bc63919eed4f02
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2986af12f9b1e5b1635139fbf4a19c5fe7eb2d34650d78879a887af731ae0edc
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffb257e34930ba938b49a5890a8454cb3267493523c68badfb3e8caa3afa0984
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30b14cc55558232a05c86540694a3306d830228bfb73ada754159eab17530ccb
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bc88792755a9da0da4e14d653531861fdd73db813b681f5782ec1d1a4b4fbbb
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1ccfee04a1de5af9afc9bf807e491ae6fa445afc90d08f2478c5c23668ada51
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ac4aae4488ba4c5323e8d76bb0d80f94103fc7d1d4fb43f3518976865b3ee76
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d21f3d8ca5a232578f84f269ec2411b9eb2b49f87d60a6c5e3b753c832df4afb
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f07f1c42880fa800c5c5014d57bad92bb104337262d4be0048f9945442bf9df3
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99cac8d7f6437d6a2ae851c0404ba1f45b672ba92302b71c6c4a5534f7e3c9eb
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e12cd939152eac3931f1d1718ffc59378cbdf8173831e63d4c30d338b5560ca
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b214204ac9205421e0da3948f11bd9fe3c7fd39f91ec1be34d37701802444dc4
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3c3f9a89d26fa299bcf0f43ebc82958ce6b1bbae886b10a167d41c8edbe3e3d
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d557f242ecefbd95d1e660b8f5657abbbdb80ff8187f641c64780e1ae387841
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebb17752213250f062cab0d3a0668fc2c267071bfa8ff63947dfa3bb19e5953c
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6555304629e1a3d37cefe0b2220e0d2f2d780e1a96ea1f280f0f2b13396f4e33
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc525ebc87c1f7aa58d60a510d2aa0ab9518d5c8bf6233caa3d14555e78417e5
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:920f2e69684990176b3380c873136767031d3c5b72ca3f2daee75ad1875fecc0
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4baed8cbc04198e4e73835a48a65a53f4edc654b3a24b1c73b3f5d8624e4174a
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a23982b6bc7a206a97855ce54f5d6ad0c568f6a055d2663d88687228bda7d6bd
3
+ size 11065661
global_step1851/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90b5f73da5763d8bd618db0dbad365aad25216bc27f8afae03ee4660096112dd
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16bcf9ac0b62036551b8acbc9db9b3c1eb0358b58319bc6b976223b0c6243457
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80c3f3b0535b060821b883c728f18955902716d2718d5e741ffd223bf002d8a6
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bf8b9e5f6e87e3f78eb6202c28bb3c559e66a83f3f51b1b57242c738e7e3282
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6838931b32868aae01141d6f194e8302bf8d9a84ca685302d59280ab58466e4f
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a56344a10b279fadb8d0d141b60209e77c02449e61f154b329f29716691c32d2
3
+ size 11065655
global_step1851/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76827fa3b7dad13afd552e09d03fe62c1aa41a48f7d55e9b170a50cafa6b4ec4
3
+ size 11065655
global_step1851/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93b3877dd23615af54355e8c7c39550729cec91b78fde54ea0ef6a4a3fee65b
3
+ size 526932687
global_step1851/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d51aa79247167cab6c12bc19d50868cf6e463b2777ce76651c461044e0bc46b
3
+ size 526935445
global_step1851/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce906b0d6b350a48c983d1ce236c363ae0823a4c8d71f9cfaee7883b191be4d4
3
+ size 526935445
global_step1851/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bec42fd58898de452f3986ca86f2f05eacb3ed429e8e4b48b79f59626707180d
3
+ size 526935445
global_step1851/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9521594521b888df18bc98094ae9d6d12e620f63587ca9ad94141b25b0e2f80
3
+ size 526935445
global_step1851/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db95b3cc74d30eb5fa45d5e7e6b8b02d64719fa34afe27b597ff84a3becd9be8
3
+ size 526935445
global_step1851/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eab529ea20ced93e80dca7ecab4c69a05e748341f0259daaf863895a288f1e83
3
+ size 526935445
global_step1851/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f7f1a538fdd8f7665cc455c03bdd8f6c1b8bb15062048f748ceba7f3e99dd53
3
+ size 526935445
global_step1851/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc00c0885cdddde76db513e739f58456e95a255fe0a9d4f009463079ed0b102e
3
+ size 526935445
global_step1851/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d73143ba31897864028bc99357fb7b6432573df23106a13f343bb971ee88ff9
3
+ size 526935445
global_step1851/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d05a6d71b9bb4d67a0941daf6834d79d8f7ad7d77cdd0fa9f5c58aec902f9d01
3
+ size 526935445
global_step1851/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abd26f545bbaf53db05106c2d762f978c218701550b8742c63fd6569097fca55
3
+ size 526932687
global_step1851/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f69acd690339f4e607dc2ed0be2f448a55cd6b14f0ec223d7fcb37bc2e8edcfd
3
+ size 526935445
global_step1851/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48a5abec20e07c4989d51c3b011a577aea82c3d56a50ac65eb1f534e40350060
3
+ size 526935445
global_step1851/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d09274d1752934484470667d48d5b5738b7ca64408882b1550526fcbfc9daa5
3
+ size 526935445