domenicrosati
committed on
Commit
·
da39604
1
Parent(s):
5e832df
Training in progress, step 500
Browse files
- .gitignore +1 -0
- added_tokens.json +3 -0
- config.json +35 -0
- pytorch_model.bin +3 -0
- runs/Jun29_20-22-09_n9orfgdtp5/1656534139.9433937/events.out.tfevents.1656534139.n9orfgdtp5.109.1 +3 -0
- runs/Jun29_20-22-09_n9orfgdtp5/events.out.tfevents.1656534139.n9orfgdtp5.109.0 +3 -0
- runs/Jun29_20-30-21_n9orfgdtp5/1656534625.96981/events.out.tfevents.1656534625.n9orfgdtp5.109.3 +3 -0
- runs/Jun29_20-30-21_n9orfgdtp5/1656534634.0046217/events.out.tfevents.1656534634.n9orfgdtp5.109.4 +3 -0
- runs/Jun29_20-30-21_n9orfgdtp5/1656534761.271622/events.out.tfevents.1656534761.n9orfgdtp5.109.5 +3 -0
- runs/Jun29_20-30-21_n9orfgdtp5/events.out.tfevents.1656534625.n9orfgdtp5.109.2 +3 -0
- runs/Jun29_20-34-27_n9orfgdtp5/1656534874.5505419/events.out.tfevents.1656534874.n9orfgdtp5.371.1 +3 -0
- runs/Jun29_20-34-27_n9orfgdtp5/1656535102.6915376/events.out.tfevents.1656535102.n9orfgdtp5.371.2 +3 -0
- runs/Jun29_20-34-27_n9orfgdtp5/events.out.tfevents.1656534874.n9orfgdtp5.371.0 +3 -0
- runs/Jun29_20-39-48_n9orfgdtp5/1656535193.259896/events.out.tfevents.1656535193.n9orfgdtp5.371.4 +3 -0
- runs/Jun29_20-39-48_n9orfgdtp5/events.out.tfevents.1656535193.n9orfgdtp5.371.3 +3 -0
- runs/Jun29_20-41-44_n9orfgdtp5/1656535335.807074/events.out.tfevents.1656535335.n9orfgdtp5.371.6 +3 -0
- runs/Jun29_20-41-44_n9orfgdtp5/events.out.tfevents.1656535335.n9orfgdtp5.371.5 +3 -0
- runs/Jun29_20-43-48_n9orfgdtp5/1656535435.43453/events.out.tfevents.1656535435.n9orfgdtp5.371.8 +3 -0
- runs/Jun29_20-43-48_n9orfgdtp5/events.out.tfevents.1656535435.n9orfgdtp5.371.7 +3 -0
- runs/Jun29_20-47-06_n9orfgdtp5/1656535633.1010277/events.out.tfevents.1656535633.n9orfgdtp5.597.1 +3 -0
- runs/Jun29_20-47-06_n9orfgdtp5/1656535656.6862278/events.out.tfevents.1656535656.n9orfgdtp5.597.2 +3 -0
- runs/Jun29_20-47-06_n9orfgdtp5/events.out.tfevents.1656535633.n9orfgdtp5.597.0 +3 -0
- runs/Jun29_20-52-12_n9orfgdtp5/1656535939.9731603/events.out.tfevents.1656535939.n9orfgdtp5.683.1 +3 -0
- runs/Jun29_20-52-12_n9orfgdtp5/events.out.tfevents.1656535939.n9orfgdtp5.683.0 +3 -0
- runs/Jun29_20-52-51_n9orfgdtp5/1656535976.221112/events.out.tfevents.1656535976.n9orfgdtp5.683.3 +3 -0
- runs/Jun29_20-52-51_n9orfgdtp5/events.out.tfevents.1656535976.n9orfgdtp5.683.2 +3 -0
- runs/Jun29_20-58-22_n9orfgdtp5/1656536309.9024267/events.out.tfevents.1656536309.n9orfgdtp5.835.1 +3 -0
- runs/Jun29_20-58-22_n9orfgdtp5/events.out.tfevents.1656536309.n9orfgdtp5.835.0 +3 -0
- runs/Jun29_21-02-48_n9orfgdtp5/1656536575.638863/events.out.tfevents.1656536575.n9orfgdtp5.936.1 +3 -0
- runs/Jun29_21-02-48_n9orfgdtp5/events.out.tfevents.1656536575.n9orfgdtp5.936.0 +3 -0
- runs/Jun29_21-19-58_n9orfgdtp5/1656537605.8520396/events.out.tfevents.1656537605.n9orfgdtp5.1021.1 +3 -0
- runs/Jun29_21-19-58_n9orfgdtp5/events.out.tfevents.1656537605.n9orfgdtp5.1021.0 +3 -0
- special_tokens_map.json +9 -0
- spm.model +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +16 -0
- training_args.bin +3 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"[MASK]": 128000
|
3 |
+
}
|
config.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "microsoft/deberta-v3-xsmall",
|
3 |
+
"architectures": [
|
4 |
+
"DebertaV2ForMaskedLM"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"hidden_act": "gelu",
|
8 |
+
"hidden_dropout_prob": 0.1,
|
9 |
+
"hidden_size": 384,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 1536,
|
12 |
+
"layer_norm_eps": 1e-07,
|
13 |
+
"max_position_embeddings": 512,
|
14 |
+
"max_relative_positions": -1,
|
15 |
+
"model_type": "deberta-v2",
|
16 |
+
"norm_rel_ebd": "layer_norm",
|
17 |
+
"num_attention_heads": 6,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"pooler_dropout": 0,
|
21 |
+
"pooler_hidden_act": "gelu",
|
22 |
+
"pooler_hidden_size": 384,
|
23 |
+
"pos_att_type": [
|
24 |
+
"p2c",
|
25 |
+
"c2p"
|
26 |
+
],
|
27 |
+
"position_biased_input": false,
|
28 |
+
"position_buckets": 256,
|
29 |
+
"relative_attention": true,
|
30 |
+
"share_att_key": true,
|
31 |
+
"torch_dtype": "float32",
|
32 |
+
"transformers_version": "4.20.1",
|
33 |
+
"type_vocab_size": 0,
|
34 |
+
"vocab_size": 128100
|
35 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f240d3ee476217e3204f5d92f7df9868ac94feeca863dc3d3f20d38b358bd143
|
3 |
+
size 283908201
|
runs/Jun29_20-22-09_n9orfgdtp5/1656534139.9433937/events.out.tfevents.1656534139.n9orfgdtp5.109.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:638168aba3aef5c72d8058427b7fc06907089da5c20df839c5b67265b733919e
|
3 |
+
size 5409
|
runs/Jun29_20-22-09_n9orfgdtp5/events.out.tfevents.1656534139.n9orfgdtp5.109.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ede79d0523cfb70dac5994c88d3869a17395aa53ef84a2839084786f25b6a3df
|
3 |
+
size 3838
|
runs/Jun29_20-30-21_n9orfgdtp5/1656534625.96981/events.out.tfevents.1656534625.n9orfgdtp5.109.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e07bbbb78cf5b5f95aed3f527cd59daf70b77c81e9bd25980dcebb263eb61290
|
3 |
+
size 5409
|
runs/Jun29_20-30-21_n9orfgdtp5/1656534634.0046217/events.out.tfevents.1656534634.n9orfgdtp5.109.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2c01b7645c883431c39974c00aceeec4cf81c5d0614af15c14abb5ede53727e
|
3 |
+
size 5409
|
runs/Jun29_20-30-21_n9orfgdtp5/1656534761.271622/events.out.tfevents.1656534761.n9orfgdtp5.109.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a97fcae9404564b7a1d90fed7cac23ba4bf9c7e7069bd4b03f3bc52d02ae96f
|
3 |
+
size 5409
|
runs/Jun29_20-30-21_n9orfgdtp5/events.out.tfevents.1656534625.n9orfgdtp5.109.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:032ffce6b19201eeea638c3359b43b22155ac9bd9438cddfc8298ababb3799ed
|
3 |
+
size 11434
|
runs/Jun29_20-34-27_n9orfgdtp5/1656534874.5505419/events.out.tfevents.1656534874.n9orfgdtp5.371.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13a90890ddf87b9b49d8dd953a58040a3c8e7432eb3bda10f7664a66da610484
|
3 |
+
size 5409
|
runs/Jun29_20-34-27_n9orfgdtp5/1656535102.6915376/events.out.tfevents.1656535102.n9orfgdtp5.371.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:334e5e8cc723e1f530971aa1cc583f346f30bb2760100e1607d3db4e5927b1dc
|
3 |
+
size 5409
|
runs/Jun29_20-34-27_n9orfgdtp5/events.out.tfevents.1656534874.n9orfgdtp5.371.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:884287371f8573c7c028f74f39a4b7f9f41bf0087134b8e12dd76908d5ca70b2
|
3 |
+
size 7636
|
runs/Jun29_20-39-48_n9orfgdtp5/1656535193.259896/events.out.tfevents.1656535193.n9orfgdtp5.371.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2144634846b6d342a144cd080d8f86edcd6f6a45a66561d222c773c002636854
|
3 |
+
size 5409
|
runs/Jun29_20-39-48_n9orfgdtp5/events.out.tfevents.1656535193.n9orfgdtp5.371.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d0a94b85a3dd8e1c1fd77d50b55664b6830d015de5c29275383ab78547573e0
|
3 |
+
size 3838
|
runs/Jun29_20-41-44_n9orfgdtp5/1656535335.807074/events.out.tfevents.1656535335.n9orfgdtp5.371.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afce2c026337a2aa72a7bf4e0680abe5fca596b057dd62b95e6ea102cea1ced7
|
3 |
+
size 5409
|
runs/Jun29_20-41-44_n9orfgdtp5/events.out.tfevents.1656535335.n9orfgdtp5.371.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6fbf066ceac4f189067348eb41e1c3261be496c910ecf1939a2afe915a5eab9
|
3 |
+
size 3838
|
runs/Jun29_20-43-48_n9orfgdtp5/1656535435.43453/events.out.tfevents.1656535435.n9orfgdtp5.371.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3595233aa3c9b47470d4aac59de83582877d51a6c888dfef87fea701844c5817
|
3 |
+
size 5409
|
runs/Jun29_20-43-48_n9orfgdtp5/events.out.tfevents.1656535435.n9orfgdtp5.371.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8003348d9c1894de00d67b5529a9b27ead9347d78e56abc0b6344d75669208a2
|
3 |
+
size 3838
|
runs/Jun29_20-47-06_n9orfgdtp5/1656535633.1010277/events.out.tfevents.1656535633.n9orfgdtp5.597.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:329f80f51f5c96eb2148ca0a7fb57cee19a6ee64fc57a1978fe4cc0c7a0a7207
|
3 |
+
size 5409
|
runs/Jun29_20-47-06_n9orfgdtp5/1656535656.6862278/events.out.tfevents.1656535656.n9orfgdtp5.597.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d20af4e2664b560ccef28bb35b4bd2138c44d943b960272bb3191613a18d33a2
|
3 |
+
size 5409
|
runs/Jun29_20-47-06_n9orfgdtp5/events.out.tfevents.1656535633.n9orfgdtp5.597.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db9f692bdae8450959e099d6cb02c51e819b1c14f2b639961949e07065c93ce6
|
3 |
+
size 7636
|
runs/Jun29_20-52-12_n9orfgdtp5/1656535939.9731603/events.out.tfevents.1656535939.n9orfgdtp5.683.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be990b7376275e8fdf13712288fa8e45001435f701cccc69a17ca58f1bde302a
|
3 |
+
size 5409
|
runs/Jun29_20-52-12_n9orfgdtp5/events.out.tfevents.1656535939.n9orfgdtp5.683.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:231a87936fc53c6ecc21f8c461f3885f2378c3985d1b6e881b15590d6a77aa3b
|
3 |
+
size 3832
|
runs/Jun29_20-52-51_n9orfgdtp5/1656535976.221112/events.out.tfevents.1656535976.n9orfgdtp5.683.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:535d0392af2acaa8f0d72260915bb619f4f76b07aa33963427498cfa8f539616
|
3 |
+
size 5409
|
runs/Jun29_20-52-51_n9orfgdtp5/events.out.tfevents.1656535976.n9orfgdtp5.683.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d93ec079e9a13540f65f942506ef10103642d4ec34b339d0cf0312b24701f0ad
|
3 |
+
size 3832
|
runs/Jun29_20-58-22_n9orfgdtp5/1656536309.9024267/events.out.tfevents.1656536309.n9orfgdtp5.835.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d53a9121a84142273d8b2e21edc5584aed22fb947a58fb0f487cb75fe7ddfe06
|
3 |
+
size 5409
|
runs/Jun29_20-58-22_n9orfgdtp5/events.out.tfevents.1656536309.n9orfgdtp5.835.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a6a2b265548bc544f3dd45ddcf21553182ec7eafdc21bb28a932362569ae779
|
3 |
+
size 3834
|
runs/Jun29_21-02-48_n9orfgdtp5/1656536575.638863/events.out.tfevents.1656536575.n9orfgdtp5.936.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fc462d21aef55b7850caceb62fd0d7597f1b0c7ba0c4eb90f2d678266d5610a
|
3 |
+
size 5409
|
runs/Jun29_21-02-48_n9orfgdtp5/events.out.tfevents.1656536575.n9orfgdtp5.936.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9f0aef438c2da0d255cf586d05542e00e3a50c5fd67a6935907e4eaab66b8ac
|
3 |
+
size 3993
|
runs/Jun29_21-19-58_n9orfgdtp5/1656537605.8520396/events.out.tfevents.1656537605.n9orfgdtp5.1021.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bbdbf93c96c3add6966ee4944d47a3fa3f6652e644cd67103fd3ef39fa9efd4
|
3 |
+
size 5409
|
runs/Jun29_21-19-58_n9orfgdtp5/events.out.tfevents.1656537605.n9orfgdtp5.1021.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:225c4e96ce6c29d003d8b1f3d1920cbb2a3ba54716f86dce8cfd0d0fcc371260
|
3 |
+
size 4316
|
special_tokens_map.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": "[CLS]",
|
3 |
+
"cls_token": "[CLS]",
|
4 |
+
"eos_token": "[SEP]",
|
5 |
+
"mask_token": "[MASK]",
|
6 |
+
"pad_token": "[PAD]",
|
7 |
+
"sep_token": "[SEP]",
|
8 |
+
"unk_token": "[UNK]"
|
9 |
+
}
|
spm.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
|
3 |
+
size 2464616
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": "[CLS]",
|
3 |
+
"cls_token": "[CLS]",
|
4 |
+
"do_lower_case": false,
|
5 |
+
"eos_token": "[SEP]",
|
6 |
+
"mask_token": "[MASK]",
|
7 |
+
"name_or_path": "microsoft/deberta-v3-xsmall",
|
8 |
+
"pad_token": "[PAD]",
|
9 |
+
"sep_token": "[SEP]",
|
10 |
+
"sp_model_kwargs": {},
|
11 |
+
"special_tokens_map_file": null,
|
12 |
+
"split_by_punct": false,
|
13 |
+
"tokenizer_class": "DebertaV2Tokenizer",
|
14 |
+
"unk_token": "[UNK]",
|
15 |
+
"vocab_type": "spm"
|
16 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69e76471a544091dc3684577abd643c5064b43521478926bb572cc3246a4fd47
|
3 |
+
size 3375
|