domenicrosati committed on
Commit
da39604
1 Parent(s): 5e832df

Training in progress, step 500

Browse files
Files changed (37) hide show
  1. .gitignore +1 -0
  2. added_tokens.json +3 -0
  3. config.json +35 -0
  4. pytorch_model.bin +3 -0
  5. runs/Jun29_20-22-09_n9orfgdtp5/1656534139.9433937/events.out.tfevents.1656534139.n9orfgdtp5.109.1 +3 -0
  6. runs/Jun29_20-22-09_n9orfgdtp5/events.out.tfevents.1656534139.n9orfgdtp5.109.0 +3 -0
  7. runs/Jun29_20-30-21_n9orfgdtp5/1656534625.96981/events.out.tfevents.1656534625.n9orfgdtp5.109.3 +3 -0
  8. runs/Jun29_20-30-21_n9orfgdtp5/1656534634.0046217/events.out.tfevents.1656534634.n9orfgdtp5.109.4 +3 -0
  9. runs/Jun29_20-30-21_n9orfgdtp5/1656534761.271622/events.out.tfevents.1656534761.n9orfgdtp5.109.5 +3 -0
  10. runs/Jun29_20-30-21_n9orfgdtp5/events.out.tfevents.1656534625.n9orfgdtp5.109.2 +3 -0
  11. runs/Jun29_20-34-27_n9orfgdtp5/1656534874.5505419/events.out.tfevents.1656534874.n9orfgdtp5.371.1 +3 -0
  12. runs/Jun29_20-34-27_n9orfgdtp5/1656535102.6915376/events.out.tfevents.1656535102.n9orfgdtp5.371.2 +3 -0
  13. runs/Jun29_20-34-27_n9orfgdtp5/events.out.tfevents.1656534874.n9orfgdtp5.371.0 +3 -0
  14. runs/Jun29_20-39-48_n9orfgdtp5/1656535193.259896/events.out.tfevents.1656535193.n9orfgdtp5.371.4 +3 -0
  15. runs/Jun29_20-39-48_n9orfgdtp5/events.out.tfevents.1656535193.n9orfgdtp5.371.3 +3 -0
  16. runs/Jun29_20-41-44_n9orfgdtp5/1656535335.807074/events.out.tfevents.1656535335.n9orfgdtp5.371.6 +3 -0
  17. runs/Jun29_20-41-44_n9orfgdtp5/events.out.tfevents.1656535335.n9orfgdtp5.371.5 +3 -0
  18. runs/Jun29_20-43-48_n9orfgdtp5/1656535435.43453/events.out.tfevents.1656535435.n9orfgdtp5.371.8 +3 -0
  19. runs/Jun29_20-43-48_n9orfgdtp5/events.out.tfevents.1656535435.n9orfgdtp5.371.7 +3 -0
  20. runs/Jun29_20-47-06_n9orfgdtp5/1656535633.1010277/events.out.tfevents.1656535633.n9orfgdtp5.597.1 +3 -0
  21. runs/Jun29_20-47-06_n9orfgdtp5/1656535656.6862278/events.out.tfevents.1656535656.n9orfgdtp5.597.2 +3 -0
  22. runs/Jun29_20-47-06_n9orfgdtp5/events.out.tfevents.1656535633.n9orfgdtp5.597.0 +3 -0
  23. runs/Jun29_20-52-12_n9orfgdtp5/1656535939.9731603/events.out.tfevents.1656535939.n9orfgdtp5.683.1 +3 -0
  24. runs/Jun29_20-52-12_n9orfgdtp5/events.out.tfevents.1656535939.n9orfgdtp5.683.0 +3 -0
  25. runs/Jun29_20-52-51_n9orfgdtp5/1656535976.221112/events.out.tfevents.1656535976.n9orfgdtp5.683.3 +3 -0
  26. runs/Jun29_20-52-51_n9orfgdtp5/events.out.tfevents.1656535976.n9orfgdtp5.683.2 +3 -0
  27. runs/Jun29_20-58-22_n9orfgdtp5/1656536309.9024267/events.out.tfevents.1656536309.n9orfgdtp5.835.1 +3 -0
  28. runs/Jun29_20-58-22_n9orfgdtp5/events.out.tfevents.1656536309.n9orfgdtp5.835.0 +3 -0
  29. runs/Jun29_21-02-48_n9orfgdtp5/1656536575.638863/events.out.tfevents.1656536575.n9orfgdtp5.936.1 +3 -0
  30. runs/Jun29_21-02-48_n9orfgdtp5/events.out.tfevents.1656536575.n9orfgdtp5.936.0 +3 -0
  31. runs/Jun29_21-19-58_n9orfgdtp5/1656537605.8520396/events.out.tfevents.1656537605.n9orfgdtp5.1021.1 +3 -0
  32. runs/Jun29_21-19-58_n9orfgdtp5/events.out.tfevents.1656537605.n9orfgdtp5.1021.0 +3 -0
  33. special_tokens_map.json +9 -0
  34. spm.model +3 -0
  35. tokenizer.json +0 -0
  36. tokenizer_config.json +16 -0
  37. training_args.bin +3 -0
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[MASK]": 128000
3
+ }
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/deberta-v3-xsmall",
3
+ "architectures": [
4
+ "DebertaV2ForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 384,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 1536,
12
+ "layer_norm_eps": 1e-07,
13
+ "max_position_embeddings": 512,
14
+ "max_relative_positions": -1,
15
+ "model_type": "deberta-v2",
16
+ "norm_rel_ebd": "layer_norm",
17
+ "num_attention_heads": 6,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "pooler_dropout": 0,
21
+ "pooler_hidden_act": "gelu",
22
+ "pooler_hidden_size": 384,
23
+ "pos_att_type": [
24
+ "p2c",
25
+ "c2p"
26
+ ],
27
+ "position_biased_input": false,
28
+ "position_buckets": 256,
29
+ "relative_attention": true,
30
+ "share_att_key": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.20.1",
33
+ "type_vocab_size": 0,
34
+ "vocab_size": 128100
35
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f240d3ee476217e3204f5d92f7df9868ac94feeca863dc3d3f20d38b358bd143
3
+ size 283908201
runs/Jun29_20-22-09_n9orfgdtp5/1656534139.9433937/events.out.tfevents.1656534139.n9orfgdtp5.109.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:638168aba3aef5c72d8058427b7fc06907089da5c20df839c5b67265b733919e
3
+ size 5409
runs/Jun29_20-22-09_n9orfgdtp5/events.out.tfevents.1656534139.n9orfgdtp5.109.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ede79d0523cfb70dac5994c88d3869a17395aa53ef84a2839084786f25b6a3df
3
+ size 3838
runs/Jun29_20-30-21_n9orfgdtp5/1656534625.96981/events.out.tfevents.1656534625.n9orfgdtp5.109.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e07bbbb78cf5b5f95aed3f527cd59daf70b77c81e9bd25980dcebb263eb61290
3
+ size 5409
runs/Jun29_20-30-21_n9orfgdtp5/1656534634.0046217/events.out.tfevents.1656534634.n9orfgdtp5.109.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2c01b7645c883431c39974c00aceeec4cf81c5d0614af15c14abb5ede53727e
3
+ size 5409
runs/Jun29_20-30-21_n9orfgdtp5/1656534761.271622/events.out.tfevents.1656534761.n9orfgdtp5.109.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a97fcae9404564b7a1d90fed7cac23ba4bf9c7e7069bd4b03f3bc52d02ae96f
3
+ size 5409
runs/Jun29_20-30-21_n9orfgdtp5/events.out.tfevents.1656534625.n9orfgdtp5.109.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:032ffce6b19201eeea638c3359b43b22155ac9bd9438cddfc8298ababb3799ed
3
+ size 11434
runs/Jun29_20-34-27_n9orfgdtp5/1656534874.5505419/events.out.tfevents.1656534874.n9orfgdtp5.371.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13a90890ddf87b9b49d8dd953a58040a3c8e7432eb3bda10f7664a66da610484
3
+ size 5409
runs/Jun29_20-34-27_n9orfgdtp5/1656535102.6915376/events.out.tfevents.1656535102.n9orfgdtp5.371.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:334e5e8cc723e1f530971aa1cc583f346f30bb2760100e1607d3db4e5927b1dc
3
+ size 5409
runs/Jun29_20-34-27_n9orfgdtp5/events.out.tfevents.1656534874.n9orfgdtp5.371.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:884287371f8573c7c028f74f39a4b7f9f41bf0087134b8e12dd76908d5ca70b2
3
+ size 7636
runs/Jun29_20-39-48_n9orfgdtp5/1656535193.259896/events.out.tfevents.1656535193.n9orfgdtp5.371.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2144634846b6d342a144cd080d8f86edcd6f6a45a66561d222c773c002636854
3
+ size 5409
runs/Jun29_20-39-48_n9orfgdtp5/events.out.tfevents.1656535193.n9orfgdtp5.371.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d0a94b85a3dd8e1c1fd77d50b55664b6830d015de5c29275383ab78547573e0
3
+ size 3838
runs/Jun29_20-41-44_n9orfgdtp5/1656535335.807074/events.out.tfevents.1656535335.n9orfgdtp5.371.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afce2c026337a2aa72a7bf4e0680abe5fca596b057dd62b95e6ea102cea1ced7
3
+ size 5409
runs/Jun29_20-41-44_n9orfgdtp5/events.out.tfevents.1656535335.n9orfgdtp5.371.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6fbf066ceac4f189067348eb41e1c3261be496c910ecf1939a2afe915a5eab9
3
+ size 3838
runs/Jun29_20-43-48_n9orfgdtp5/1656535435.43453/events.out.tfevents.1656535435.n9orfgdtp5.371.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3595233aa3c9b47470d4aac59de83582877d51a6c888dfef87fea701844c5817
3
+ size 5409
runs/Jun29_20-43-48_n9orfgdtp5/events.out.tfevents.1656535435.n9orfgdtp5.371.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8003348d9c1894de00d67b5529a9b27ead9347d78e56abc0b6344d75669208a2
3
+ size 3838
runs/Jun29_20-47-06_n9orfgdtp5/1656535633.1010277/events.out.tfevents.1656535633.n9orfgdtp5.597.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:329f80f51f5c96eb2148ca0a7fb57cee19a6ee64fc57a1978fe4cc0c7a0a7207
3
+ size 5409
runs/Jun29_20-47-06_n9orfgdtp5/1656535656.6862278/events.out.tfevents.1656535656.n9orfgdtp5.597.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d20af4e2664b560ccef28bb35b4bd2138c44d943b960272bb3191613a18d33a2
3
+ size 5409
runs/Jun29_20-47-06_n9orfgdtp5/events.out.tfevents.1656535633.n9orfgdtp5.597.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db9f692bdae8450959e099d6cb02c51e819b1c14f2b639961949e07065c93ce6
3
+ size 7636
runs/Jun29_20-52-12_n9orfgdtp5/1656535939.9731603/events.out.tfevents.1656535939.n9orfgdtp5.683.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be990b7376275e8fdf13712288fa8e45001435f701cccc69a17ca58f1bde302a
3
+ size 5409
runs/Jun29_20-52-12_n9orfgdtp5/events.out.tfevents.1656535939.n9orfgdtp5.683.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:231a87936fc53c6ecc21f8c461f3885f2378c3985d1b6e881b15590d6a77aa3b
3
+ size 3832
runs/Jun29_20-52-51_n9orfgdtp5/1656535976.221112/events.out.tfevents.1656535976.n9orfgdtp5.683.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:535d0392af2acaa8f0d72260915bb619f4f76b07aa33963427498cfa8f539616
3
+ size 5409
runs/Jun29_20-52-51_n9orfgdtp5/events.out.tfevents.1656535976.n9orfgdtp5.683.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d93ec079e9a13540f65f942506ef10103642d4ec34b339d0cf0312b24701f0ad
3
+ size 3832
runs/Jun29_20-58-22_n9orfgdtp5/1656536309.9024267/events.out.tfevents.1656536309.n9orfgdtp5.835.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d53a9121a84142273d8b2e21edc5584aed22fb947a58fb0f487cb75fe7ddfe06
3
+ size 5409
runs/Jun29_20-58-22_n9orfgdtp5/events.out.tfevents.1656536309.n9orfgdtp5.835.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a6a2b265548bc544f3dd45ddcf21553182ec7eafdc21bb28a932362569ae779
3
+ size 3834
runs/Jun29_21-02-48_n9orfgdtp5/1656536575.638863/events.out.tfevents.1656536575.n9orfgdtp5.936.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc462d21aef55b7850caceb62fd0d7597f1b0c7ba0c4eb90f2d678266d5610a
3
+ size 5409
runs/Jun29_21-02-48_n9orfgdtp5/events.out.tfevents.1656536575.n9orfgdtp5.936.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9f0aef438c2da0d255cf586d05542e00e3a50c5fd67a6935907e4eaab66b8ac
3
+ size 3993
runs/Jun29_21-19-58_n9orfgdtp5/1656537605.8520396/events.out.tfevents.1656537605.n9orfgdtp5.1021.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bbdbf93c96c3add6966ee4944d47a3fa3f6652e644cd67103fd3ef39fa9efd4
3
+ size 5409
runs/Jun29_21-19-58_n9orfgdtp5/events.out.tfevents.1656537605.n9orfgdtp5.1021.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:225c4e96ce6c29d003d8b1f3d1920cbb2a3ba54716f86dce8cfd0d0fcc371260
3
+ size 4316
special_tokens_map.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": "[MASK]",
6
+ "pad_token": "[PAD]",
7
+ "sep_token": "[SEP]",
8
+ "unk_token": "[UNK]"
9
+ }
spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": false,
5
+ "eos_token": "[SEP]",
6
+ "mask_token": "[MASK]",
7
+ "name_or_path": "microsoft/deberta-v3-xsmall",
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "sp_model_kwargs": {},
11
+ "special_tokens_map_file": null,
12
+ "split_by_punct": false,
13
+ "tokenizer_class": "DebertaV2Tokenizer",
14
+ "unk_token": "[UNK]",
15
+ "vocab_type": "spm"
16
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69e76471a544091dc3684577abd643c5064b43521478926bb572cc3246a4fd47
3
+ size 3375