ZongqianLi commited on
Commit
501dc72
1 Parent(s): 8eeef79

Upload 130 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. global_step3180/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  3. global_step3180/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. global_step3180/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  5. global_step3180/zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step3180/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  7. global_step3180/zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step3180/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  9. global_step3180/zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. global_step3180/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  11. global_step3180/zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  12. global_step3180/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  13. global_step3180/zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  14. global_step3180/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  15. global_step3180/zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  16. global_step3180/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  17. global_step3180/zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. global_step3180/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  19. global_step3180/zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  20. global_step3180/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  21. global_step3180/zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  22. global_step3180/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  23. global_step3180/zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  24. global_step3180/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  25. global_step3180/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  26. global_step3180/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  27. global_step3180/zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  28. global_step3180/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  29. global_step3180/zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  30. global_step3180/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  31. global_step3180/zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  32. global_step3180/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  33. global_step3180/zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  34. global_step3180/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  35. global_step3180/zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  36. global_step3180/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  37. global_step3180/zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  38. global_step3180/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  39. global_step3180/zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  40. global_step3180/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  41. global_step3180/zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  42. global_step3180/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
  43. global_step3180/zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  44. global_step3180/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
  45. global_step3180/zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  46. global_step3180/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
  47. global_step3180/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  48. global_step3180/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
  49. global_step3180/zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  50. global_step3180/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-large-cased",
3
+ "architectures": [
4
+ "BertForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "directionality": "bidi",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 4096,
15
+ "layer_norm_eps": 1e-12,
16
+ "max_position_embeddings": 512,
17
+ "model_type": "bert",
18
+ "num_attention_heads": 16,
19
+ "num_hidden_layers": 24,
20
+ "pad_token_id": 0,
21
+ "pooler_fc_size": 768,
22
+ "pooler_num_attention_heads": 12,
23
+ "pooler_num_fc_layers": 3,
24
+ "pooler_size_per_head": 128,
25
+ "pooler_type": "first_token_transform",
26
+ "position_embedding_type": "absolute",
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.25.1",
29
+ "type_vocab_size": 2,
30
+ "use_cache": true,
31
+ "vocab_size": 28996
32
+ }
global_step3180/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f07826684ba404c769499e0d2b5d1905d7a6739c28f771849d4c622c4f30c7b
3
+ size 172267
global_step3180/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8e3e698ba19593c54df524d6ee5750fa2bf62aa44bcfee127359a1f2030c33
3
+ size 100088099
global_step3180/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6364edf9af2848d5f102d2df933571d585f1e30ac007ac3cd69d4c9544f56f99
3
+ size 172267
global_step3180/zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8dc9560fe01180aad72422e3fc3dbf77096cc713a173d1a0d92c1f7bbb8b2b9
3
+ size 100088099
global_step3180/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66260a9a33f56e9fd30bce151a20392a9f36b5ef0cdeb566d4482fc47c3d178a
3
+ size 172267
global_step3180/zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80a883bbfe7b090d15002720e7ba33c63cad775cab6636bbdf6a41f653a0e499
3
+ size 100088099
global_step3180/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f07826684ba404c769499e0d2b5d1905d7a6739c28f771849d4c622c4f30c7b
3
+ size 172267
global_step3180/zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1444f2a29092ccb73019f2fc0cc7cf8179e221140671661244543e6774e181b3
3
+ size 100088099
global_step3180/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0b8f59f679943a3c5fa829d70540495b275d0482663d8aa26fd5bef3ee58d3
3
+ size 172267
global_step3180/zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30beb04b7bd26293244e4747a0279b44a76df1ad393f0d6fd31d1ecdc2157495
3
+ size 100088099
global_step3180/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6364edf9af2848d5f102d2df933571d585f1e30ac007ac3cd69d4c9544f56f99
3
+ size 172267
global_step3180/zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d64483f6f8a8de4fc99affebe9797b9a798f2d34ee251957b9dd8673e099180
3
+ size 100088099
global_step3180/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66260a9a33f56e9fd30bce151a20392a9f36b5ef0cdeb566d4482fc47c3d178a
3
+ size 172267
global_step3180/zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33b8cfad76283bf821d3c09a844a670205c4d72754588c11f12443bc0b17e455
3
+ size 100088099
global_step3180/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f07826684ba404c769499e0d2b5d1905d7a6739c28f771849d4c622c4f30c7b
3
+ size 172267
global_step3180/zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44414d7edd56a3ae880b313c07532987b8d94aeacc45b569e12f71f46c4c22d5
3
+ size 100088099
global_step3180/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0b8f59f679943a3c5fa829d70540495b275d0482663d8aa26fd5bef3ee58d3
3
+ size 172267
global_step3180/zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bc0ffc9800a9c31a52c5af3c829f6267b71bd1e72d26d01ae6dc4786704d7ba
3
+ size 100088099
global_step3180/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6364edf9af2848d5f102d2df933571d585f1e30ac007ac3cd69d4c9544f56f99
3
+ size 172267
global_step3180/zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7417f4c8252fea66cb385279394e0ca99b5a0f510834475e3a08fe339c22624c
3
+ size 100088099
global_step3180/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66260a9a33f56e9fd30bce151a20392a9f36b5ef0cdeb566d4482fc47c3d178a
3
+ size 172267
global_step3180/zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:181bb620acb427fe3311b2ddc0a39b18af0ac3ee559024fc73270ee11724d533
3
+ size 100088099
global_step3180/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0b8f59f679943a3c5fa829d70540495b275d0482663d8aa26fd5bef3ee58d3
3
+ size 172267
global_step3180/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e3f4b39757ba5927a81612f7573671a8e56976dcbd7029fb7e7d426576fb3e6
3
+ size 100088099
global_step3180/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f07826684ba404c769499e0d2b5d1905d7a6739c28f771849d4c622c4f30c7b
3
+ size 172267
global_step3180/zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ca9e303e30fef19bd024d8ef1dcf4f482a74555fb06c03e7039e5d1a5f325d4
3
+ size 100088099
global_step3180/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0b8f59f679943a3c5fa829d70540495b275d0482663d8aa26fd5bef3ee58d3
3
+ size 172267
global_step3180/zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:333e7d1e2edbdbb32bdd2bba17606aaf311024751ff211d31cdb94c9ee68fb0b
3
+ size 100088099
global_step3180/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6364edf9af2848d5f102d2df933571d585f1e30ac007ac3cd69d4c9544f56f99
3
+ size 172267
global_step3180/zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b674ad2b11ce6eda818008e925ce4a5586396191377a793e5adba108baace44
3
+ size 100088099
global_step3180/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66260a9a33f56e9fd30bce151a20392a9f36b5ef0cdeb566d4482fc47c3d178a
3
+ size 172267
global_step3180/zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab5d09fc04f687f77cbdab179ce01d41ff78fe8931ec55753d5b931793d88b2d
3
+ size 100088099
global_step3180/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f07826684ba404c769499e0d2b5d1905d7a6739c28f771849d4c622c4f30c7b
3
+ size 172267
global_step3180/zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c62b9e07c0b88fb1464ab1fbad67ae0d165e82c3020d6ad296d2c72ec81abd2d
3
+ size 100088099
global_step3180/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0b8f59f679943a3c5fa829d70540495b275d0482663d8aa26fd5bef3ee58d3
3
+ size 172267
global_step3180/zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a9b8c05da0eb03443d84c750317bd6570adc26a84c9cb3631265c6d8a256e59
3
+ size 100088099
global_step3180/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6364edf9af2848d5f102d2df933571d585f1e30ac007ac3cd69d4c9544f56f99
3
+ size 172267
global_step3180/zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f9d680cfe68ea80bd1ad3fe06a30f56dcedbb3d4a93e10a5bd67ac242e3dd63
3
+ size 100088099
global_step3180/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66260a9a33f56e9fd30bce151a20392a9f36b5ef0cdeb566d4482fc47c3d178a
3
+ size 172267
global_step3180/zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b225dad6f8adcfb23db13640a2bf6afd6b19a72c07d3c640a02a2b18692db3e
3
+ size 100088099
global_step3180/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f07826684ba404c769499e0d2b5d1905d7a6739c28f771849d4c622c4f30c7b
3
+ size 172267
global_step3180/zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a99f502b3d8d60a884d2c6f59d1bf2a3d3ea06ee3d404c6149d36710abe9b3cd
3
+ size 100088099
global_step3180/zero_pp_rank_29_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0b8f59f679943a3c5fa829d70540495b275d0482663d8aa26fd5bef3ee58d3
3
+ size 172267
global_step3180/zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:859d9b38840bf4dcd4372e1b65fd5ff137fac421be43a92ed46a2d2ed2623431
3
+ size 100088099
global_step3180/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6364edf9af2848d5f102d2df933571d585f1e30ac007ac3cd69d4c9544f56f99
3
+ size 172267
global_step3180/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa4bde612e5b98429bfed5235657935deb8cb1ff0bc9a444104ccde0739cddb0
3
+ size 100088099
global_step3180/zero_pp_rank_30_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6364edf9af2848d5f102d2df933571d585f1e30ac007ac3cd69d4c9544f56f99
3
+ size 172267
global_step3180/zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52c534e39787ab18ce0a7575cd5d7829ccdbcf7730eb800571de017088e7b799
3
+ size 100088099
global_step3180/zero_pp_rank_31_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66260a9a33f56e9fd30bce151a20392a9f36b5ef0cdeb566d4482fc47c3d178a
3
+ size 172267