Gladiator committed on
Commit
c724aa1
1 Parent(s): 8754344

Training in progress, epoch 1

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ {
2
+ "[MASK]": 128000
3
+ }
config.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/deberta-v3-large",
3
+ "architectures": [
4
+ "DebertaV2ForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "hidden_act": "gelu",
8
+ "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 1024,
10
+ "id2label": {
11
+ "0": "O",
12
+ "1": "B-corporation",
13
+ "2": "I-corporation",
14
+ "3": "B-creative-work",
15
+ "4": "I-creative-work",
16
+ "5": "B-group",
17
+ "6": "I-group",
18
+ "7": "B-location",
19
+ "8": "I-location",
20
+ "9": "B-person",
21
+ "10": "I-person",
22
+ "11": "B-product",
23
+ "12": "I-product"
24
+ },
25
+ "initializer_range": 0.02,
26
+ "intermediate_size": 4096,
27
+ "label2id": {
28
+ "B-corporation": 1,
29
+ "B-creative-work": 3,
30
+ "B-group": 5,
31
+ "B-location": 7,
32
+ "B-person": 9,
33
+ "B-product": 11,
34
+ "I-corporation": 2,
35
+ "I-creative-work": 4,
36
+ "I-group": 6,
37
+ "I-location": 8,
38
+ "I-person": 10,
39
+ "I-product": 12,
40
+ "O": 0
41
+ },
42
+ "layer_norm_eps": 1e-07,
43
+ "max_position_embeddings": 512,
44
+ "max_relative_positions": -1,
45
+ "model_type": "deberta-v2",
46
+ "norm_rel_ebd": "layer_norm",
47
+ "num_attention_heads": 16,
48
+ "num_hidden_layers": 24,
49
+ "pad_token_id": 0,
50
+ "pooler_dropout": 0,
51
+ "pooler_hidden_act": "gelu",
52
+ "pooler_hidden_size": 1024,
53
+ "pos_att_type": [
54
+ "p2c",
55
+ "c2p"
56
+ ],
57
+ "position_biased_input": false,
58
+ "position_buckets": 256,
59
+ "relative_attention": true,
60
+ "share_att_key": true,
61
+ "torch_dtype": "float32",
62
+ "transformers_version": "4.20.1",
63
+ "type_vocab_size": 0,
64
+ "vocab_size": 128100
65
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d9e0e2bc206b9e1d599d906a36f27193fde05536aad690e87485485c86b0242
3
+ size 1736239407
runs/Dec08_18-40-00_903e296f2d0b/1670524811.4986372/events.out.tfevents.1670524811.903e296f2d0b.24.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea5742ea0eedcaf70cb478c7b14a68fc4025bde43339274e73a3e18c1f968640
3
+ size 5407
runs/Dec08_18-40-00_903e296f2d0b/events.out.tfevents.1670524811.903e296f2d0b.24.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba37ef61ae3dd551cd1a699594e99d43317194b6a0249a3e4a69c894387f8fcd
3
+ size 4914
special_tokens_map.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": "[MASK]",
6
+ "pad_token": "[PAD]",
7
+ "sep_token": "[SEP]",
8
+ "unk_token": "[UNK]"
9
+ }
spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": false,
5
+ "eos_token": "[SEP]",
6
+ "mask_token": "[MASK]",
7
+ "name_or_path": "microsoft/deberta-v3-large",
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "sp_model_kwargs": {},
11
+ "special_tokens_map_file": null,
12
+ "split_by_punct": false,
13
+ "tokenizer_class": "DebertaV2Tokenizer",
14
+ "unk_token": "[UNK]",
15
+ "vocab_type": "spm"
16
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8d523fd67e5fea3898e6f64bc1d39df2459c217c46e0d3d60f6489bf1230a68
3
+ size 3375