ZongqianLi committed on
Commit
8766291
1 Parent(s): ad1e2c7

Upload 130 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +26 -0
  2. global_step33600/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  3. global_step33600/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. global_step33600/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  5. global_step33600/zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step33600/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  7. global_step33600/zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step33600/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  9. global_step33600/zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. global_step33600/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  11. global_step33600/zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  12. global_step33600/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  13. global_step33600/zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  14. global_step33600/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  15. global_step33600/zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  16. global_step33600/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  17. global_step33600/zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. global_step33600/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  19. global_step33600/zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  20. global_step33600/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  21. global_step33600/zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  22. global_step33600/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  23. global_step33600/zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  24. global_step33600/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  25. global_step33600/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  26. global_step33600/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  27. global_step33600/zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  28. global_step33600/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  29. global_step33600/zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  30. global_step33600/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  31. global_step33600/zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  32. global_step33600/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  33. global_step33600/zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  34. global_step33600/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  35. global_step33600/zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  36. global_step33600/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  37. global_step33600/zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  38. global_step33600/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  39. global_step33600/zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  40. global_step33600/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  41. global_step33600/zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  42. global_step33600/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
  43. global_step33600/zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  44. global_step33600/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
  45. global_step33600/zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  46. global_step33600/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
  47. global_step33600/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  48. global_step33600/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
  49. global_step33600/zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  50. global_step33600/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-base-uncased",
3
+ "architectures": [
4
+ "BertForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "bert",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "position_embedding_type": "absolute",
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.25.1",
23
+ "type_vocab_size": 2,
24
+ "use_cache": true,
25
+ "vocab_size": 30522
26
+ }
global_step33600/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa3683bca71f4b10effa2808223c40f5504765b3bc757009e7138548041dab5
3
+ size 90923
global_step33600/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:955ae842fc6cf286a06d27d0a9e636a331a2c71f6ecd3b3367e7d415e296e66d
3
+ size 32858723
global_step33600/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef16f32a98873dc30875ff9412eaf33c53de5bc221b8d6c9c8a441bcde5042e1
3
+ size 90923
global_step33600/zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06e9af21fca44d51329ee770c01892153de7918cfbf4ebb1f7d521d0e94abda6
3
+ size 32858723
global_step33600/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1354f806c98bd8b248e4e58caa1433d54bd67cfa8e8d895879382e8b001c076a
3
+ size 90923
global_step33600/zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae2da1b33a3106fc017ab855388e3760f5a4733ceb2a714eae79ab06bcc8ecd2
3
+ size 32858723
global_step33600/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa3683bca71f4b10effa2808223c40f5504765b3bc757009e7138548041dab5
3
+ size 90923
global_step33600/zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1abfdb9d4846808a11c170e28a20824e2786fb140a9374812434f520d07c983
3
+ size 32858723
global_step33600/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8670e646111417c0c6eed32d32e51f73ad9083989943f76a150101b6657e60e9
3
+ size 90923
global_step33600/zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4ba1e0ddc5a80d6212252b9c3d463d87495d80b7be95ab641022420cc421a31
3
+ size 32858723
global_step33600/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef16f32a98873dc30875ff9412eaf33c53de5bc221b8d6c9c8a441bcde5042e1
3
+ size 90923
global_step33600/zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2b3891787416ff53bcadc4adb41d34d13588a2dd43ace17daf65a3741021bb8
3
+ size 32858723
global_step33600/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1354f806c98bd8b248e4e58caa1433d54bd67cfa8e8d895879382e8b001c076a
3
+ size 90923
global_step33600/zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e97067183bdfadeba97d1a18ab31947dd1e60b5f955eedd5d1e85e1a7c28553c
3
+ size 32858723
global_step33600/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa3683bca71f4b10effa2808223c40f5504765b3bc757009e7138548041dab5
3
+ size 90923
global_step33600/zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2dbc793830bd73a8c866b3ce754035969057d6a31c214d6b16aaa68b68cc4ed
3
+ size 32858723
global_step33600/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8670e646111417c0c6eed32d32e51f73ad9083989943f76a150101b6657e60e9
3
+ size 90923
global_step33600/zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6c2d901aafe387d238c07bc3d2aef0caa8d00e881a11092381418be420f791e
3
+ size 32858723
global_step33600/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef16f32a98873dc30875ff9412eaf33c53de5bc221b8d6c9c8a441bcde5042e1
3
+ size 90923
global_step33600/zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f2659a74d29cbbe76a0cd75998b5e932cab1af2463efac2f95b7f4a210ef14a
3
+ size 32858723
global_step33600/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1354f806c98bd8b248e4e58caa1433d54bd67cfa8e8d895879382e8b001c076a
3
+ size 90923
global_step33600/zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8c8f9cb2eb71e4b0e6ec0fcf29393e45809ad0046d234cb8ae1d6a5848c97a9
3
+ size 32858723
global_step33600/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8670e646111417c0c6eed32d32e51f73ad9083989943f76a150101b6657e60e9
3
+ size 90923
global_step33600/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:168f1fb2667b386790d8b9e0d5254f5243afa5c591121271a045a40860ed6b30
3
+ size 32858723
global_step33600/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa3683bca71f4b10effa2808223c40f5504765b3bc757009e7138548041dab5
3
+ size 90923
global_step33600/zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8b23e8626b9883f0f7b8bd23afddc22ccb94a6f841111d6422e2ed99ef89030
3
+ size 32858723
global_step33600/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8670e646111417c0c6eed32d32e51f73ad9083989943f76a150101b6657e60e9
3
+ size 90923
global_step33600/zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ef7502170e838a54dab28c53ed192636ee87889aa35a0801a87e3c432068c4e
3
+ size 32858723
global_step33600/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef16f32a98873dc30875ff9412eaf33c53de5bc221b8d6c9c8a441bcde5042e1
3
+ size 90923
global_step33600/zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ede738de52f9dee1e2177b4a62f32e3bfe061be9b1e061736d2909483c4783a
3
+ size 32858723
global_step33600/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1354f806c98bd8b248e4e58caa1433d54bd67cfa8e8d895879382e8b001c076a
3
+ size 90923
global_step33600/zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e410129c36f21c8acf500bfc9213a3141722b5a6aa45a7f5921a0319a3c3438d
3
+ size 32858723
global_step33600/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa3683bca71f4b10effa2808223c40f5504765b3bc757009e7138548041dab5
3
+ size 90923
global_step33600/zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e0a440d6ad5ac87a7b4849125d54f34c9c43f0b79e25d0bb96d7daed1d51b6
3
+ size 32858723
global_step33600/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8670e646111417c0c6eed32d32e51f73ad9083989943f76a150101b6657e60e9
3
+ size 90923
global_step33600/zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:001c0f3a1491ea2c8e6cd459094b65875bf6a77fe4a540c8dc0b4d1d9e7efe95
3
+ size 32858723
global_step33600/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef16f32a98873dc30875ff9412eaf33c53de5bc221b8d6c9c8a441bcde5042e1
3
+ size 90923
global_step33600/zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f98170d2509bf0dece5cbcf73cd9780d3142af7366433db763f5b90d8fc38f3
3
+ size 32858723
global_step33600/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1354f806c98bd8b248e4e58caa1433d54bd67cfa8e8d895879382e8b001c076a
3
+ size 90923
global_step33600/zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e81f3dc3d37d0c9ae1306666d56e799071ab5ebc4c3426451049e2a2e972be
3
+ size 32858723
global_step33600/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa3683bca71f4b10effa2808223c40f5504765b3bc757009e7138548041dab5
3
+ size 90923
global_step33600/zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dc78bb670344f063f7638e3a8685dc9c17512bf7515723bcd7cf4367730f85c
3
+ size 32858723
global_step33600/zero_pp_rank_29_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8670e646111417c0c6eed32d32e51f73ad9083989943f76a150101b6657e60e9
3
+ size 90923
global_step33600/zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67fc3e82fa9f4ce9004d69540b45bead7182277b36360df5fb2f429dbd5e91d3
3
+ size 32858723
global_step33600/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef16f32a98873dc30875ff9412eaf33c53de5bc221b8d6c9c8a441bcde5042e1
3
+ size 90923
global_step33600/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d6738a1f6d59e166557d3089ffcb75ae6c21ae7aa1438790888400aa40c872
3
+ size 32858723
global_step33600/zero_pp_rank_30_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef16f32a98873dc30875ff9412eaf33c53de5bc221b8d6c9c8a441bcde5042e1
3
+ size 90923
global_step33600/zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe8b279d06f1ccc6ddb323552448937ae49db958d480bfdeb842fc8cb7224ee3
3
+ size 32858723
global_step33600/zero_pp_rank_31_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1354f806c98bd8b248e4e58caa1433d54bd67cfa8e8d895879382e8b001c076a
3
+ size 90923