domenicrosati committed on
Commit
8777d66
·
1 Parent(s): c45019b

Training in progress, step 500

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"[MASK]": 128000}
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/deberta-v3-xsmall",
3
+ "architectures": [
4
+ "DebertaV2ForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 384,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 1536,
12
+ "layer_norm_eps": 1e-07,
13
+ "max_position_embeddings": 512,
14
+ "max_relative_positions": -1,
15
+ "model_type": "deberta-v2",
16
+ "norm_rel_ebd": "layer_norm",
17
+ "num_attention_heads": 6,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "pooler_dropout": 0,
21
+ "pooler_hidden_act": "gelu",
22
+ "pooler_hidden_size": 384,
23
+ "pos_att_type": [
24
+ "p2c",
25
+ "c2p"
26
+ ],
27
+ "position_biased_input": false,
28
+ "position_buckets": 256,
29
+ "relative_attention": true,
30
+ "share_att_key": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.18.0",
33
+ "type_vocab_size": 0,
34
+ "vocab_size": 128100
35
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:638ae7a82064a32d0b8d3998502a558e581beddbd061723159258f005631577b
3
+ size 283395115
runs/Jun24_23-00-52_5439eaefa85f/1656111666.1640413/events.out.tfevents.1656111666.5439eaefa85f.33.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b62d29be7937c01bfd0cedb5f05aebbecca44433278748aeefdf3957aa29fb44
3
+ size 4905
runs/Jun24_23-00-52_5439eaefa85f/events.out.tfevents.1656111666.5439eaefa85f.33.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:183edc99348b449622f04094744aa7c32e1ac77427b34e59ef1567741d793b9d
3
+ size 40
runs/Jun24_23-03-04_5439eaefa85f/1656111791.7679906/events.out.tfevents.1656111791.5439eaefa85f.517.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff2233cd746f73fe71468767568ff8e4767b2f89693bd867ebdf0290ff357c43
3
+ size 4905
runs/Jun24_23-03-04_5439eaefa85f/events.out.tfevents.1656111791.5439eaefa85f.517.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f3f288d1cfda55daf843eda710c09465b16c7c26da0ecb6ec4799e8c8338250
3
+ size 40
runs/Jun24_23-05-16_5439eaefa85f/1656111924.0096588/events.out.tfevents.1656111924.5439eaefa85f.713.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebbd3ef1e11570ebd2b2912c006d4bf530cb641e65a4becb8af50a75d2452d80
3
+ size 4905
runs/Jun24_23-05-16_5439eaefa85f/events.out.tfevents.1656111923.5439eaefa85f.713.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf9af744613e7c65005250ad955236a0a1272ed7118f2de0b1c954a52d20ced6
3
+ size 3554
runs/Jun24_23-08-48_5439eaefa85f/1656112136.514852/events.out.tfevents.1656112136.5439eaefa85f.960.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:061ecd6012ed8da96e787d8cca97fb1633a5c0efbe64438d821843c7849b2229
3
+ size 4905
runs/Jun24_23-08-48_5439eaefa85f/events.out.tfevents.1656112136.5439eaefa85f.960.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f54397e4d470bcf99eef2b4e55f323e0de141e06718725d4905b07a0cdfe7c
3
+ size 4080
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": false, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "split_by_punct": false, "sp_model_kwargs": {}, "vocab_type": "spm", "special_tokens_map_file": null, "name_or_path": "microsoft/deberta-v3-xsmall", "tokenizer_class": "DebertaV2Tokenizer"}
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:235e2348ef081352eb757957c79778d149c30e625407c1aee6716305fd0b4262
3
+ size 3183