KoichiYasuoka committed on
Commit
1d6c0f4
1 Parent(s): d8dc46d

model improved

Browse files
Files changed (1) hide show
  1. config.json +100 -99
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "architectures": [
3
  "RobertaForTokenClassification"
4
  ],
@@ -10,108 +11,108 @@
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 256,
12
  "id2label": {
13
- "0": "I-ADJ",
14
- "1": "I-NUM",
15
- "2": "I-ADV",
16
- "3": "B-ADP",
17
- "4": "I-NOUN",
18
- "5": "I-DET",
19
- "6": "B-ADV",
20
- "7": "I-VERB",
21
- "8": "VERB",
22
- "9": "I-CCONJ",
23
- "10": "AUX",
24
- "11": "I-SCONJ",
25
- "12": "B-DET",
26
- "13": "B-ADJ",
27
- "14": "I-PART",
28
- "15": "ADV",
29
- "16": "B-INTJ",
30
- "17": "X",
31
- "18": "CCONJ",
32
- "19": "NOUN",
33
- "20": "B-AUX",
34
- "21": "INTJ",
35
- "22": "B-SYM",
36
- "23": "SCONJ",
37
- "24": "I-INTJ",
38
- "25": "ADJ",
39
- "26": "B-PRON",
40
- "27": "B-X",
41
- "28": "DET",
42
- "29": "SYM",
43
- "30": "I-PRON",
44
- "31": "I-SYM",
45
- "32": "PUNCT",
46
- "33": "I-PROPN",
47
- "34": "I-AUX",
48
- "35": "PART",
49
- "36": "B-NUM",
50
- "37": "I-X",
51
- "38": "B-SCONJ",
52
- "39": "B-PROPN",
53
- "40": "B-PART",
54
- "41": "I-ADP",
55
- "42": "B-VERB",
56
- "43": "ADP",
57
- "44": "PROPN",
58
- "45": "B-NOUN",
59
- "46": "PRON",
60
- "47": "B-CCONJ",
61
- "48": "NUM"
62
  },
63
  "initializer_range": 0.02,
64
  "intermediate_size": 768,
65
  "label2id": {
66
- "ADJ": 25,
67
- "ADP": 43,
68
- "ADV": 15,
69
- "AUX": 10,
70
- "B-ADJ": 13,
71
- "B-ADP": 3,
72
- "B-ADV": 6,
73
- "B-AUX": 20,
74
- "B-CCONJ": 47,
75
- "B-DET": 12,
76
- "B-INTJ": 16,
77
- "B-NOUN": 45,
78
- "B-NUM": 36,
79
- "B-PART": 40,
80
- "B-PRON": 26,
81
- "B-PROPN": 39,
82
- "B-SCONJ": 38,
83
- "B-SYM": 22,
84
- "B-VERB": 42,
85
- "B-X": 27,
86
- "CCONJ": 18,
87
- "DET": 28,
88
- "I-ADJ": 0,
89
- "I-ADP": 41,
90
- "I-ADV": 2,
91
- "I-AUX": 34,
92
- "I-CCONJ": 9,
93
- "I-DET": 5,
94
- "I-INTJ": 24,
95
- "I-NOUN": 4,
96
- "I-NUM": 1,
97
- "I-PART": 14,
98
- "I-PRON": 30,
99
- "I-PROPN": 33,
100
- "I-SCONJ": 11,
101
- "I-SYM": 31,
102
- "I-VERB": 7,
103
- "I-X": 37,
104
- "INTJ": 21,
105
- "NOUN": 19,
106
- "NUM": 48,
107
- "PART": 35,
108
- "PRON": 46,
109
- "PROPN": 44,
110
- "PUNCT": 32,
111
- "SCONJ": 23,
112
- "SYM": 29,
113
- "VERB": 8,
114
- "X": 17
115
  },
116
  "layer_norm_eps": 1e-12,
117
  "max_position_embeddings": 128,
@@ -122,7 +123,7 @@
122
  "position_embedding_type": "absolute",
123
  "tokenizer_class": "RemBertTokenizerFast",
124
  "torch_dtype": "float32",
125
- "transformers_version": "4.12.2",
126
  "type_vocab_size": 2,
127
  "use_cache": true,
128
  "vocab_size": 250315
 
1
  {
2
+ "_name_or_path": "KoichiYasuoka/roberta-small-japanese-aozora",
3
  "architectures": [
4
  "RobertaForTokenClassification"
5
  ],
 
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 256,
13
  "id2label": {
14
+ "0": "SCONJ",
15
+ "1": "B-VERB",
16
+ "2": "I-SCONJ",
17
+ "3": "VERB",
18
+ "4": "B-AUX",
19
+ "5": "PART",
20
+ "6": "I-ADJ",
21
+ "7": "I-ADP",
22
+ "8": "B-NOUN",
23
+ "9": "PRON",
24
+ "10": "B-ADP",
25
+ "11": "NOUN",
26
+ "12": "NUM",
27
+ "13": "PUNCT",
28
+ "14": "B-X",
29
+ "15": "CCONJ",
30
+ "16": "ADV",
31
+ "17": "B-PRON",
32
+ "18": "I-PRON",
33
+ "19": "I-NOUN",
34
+ "20": "B-ADV",
35
+ "21": "AUX",
36
+ "22": "ADP",
37
+ "23": "I-NUM",
38
+ "24": "B-DET",
39
+ "25": "I-X",
40
+ "26": "B-PART",
41
+ "27": "I-DET",
42
+ "28": "B-INTJ",
43
+ "29": "INTJ",
44
+ "30": "B-NUM",
45
+ "31": "I-VERB",
46
+ "32": "I-ADV",
47
+ "33": "I-AUX",
48
+ "34": "B-PROPN",
49
+ "35": "B-SYM",
50
+ "36": "I-PART",
51
+ "37": "I-INTJ",
52
+ "38": "X",
53
+ "39": "I-PROPN",
54
+ "40": "B-ADJ",
55
+ "41": "DET",
56
+ "42": "SYM",
57
+ "43": "ADJ",
58
+ "44": "B-SCONJ",
59
+ "45": "B-CCONJ",
60
+ "46": "PROPN",
61
+ "47": "I-CCONJ",
62
+ "48": "I-SYM"
63
  },
64
  "initializer_range": 0.02,
65
  "intermediate_size": 768,
66
  "label2id": {
67
+ "ADJ": 43,
68
+ "ADP": 22,
69
+ "ADV": 16,
70
+ "AUX": 21,
71
+ "B-ADJ": 40,
72
+ "B-ADP": 10,
73
+ "B-ADV": 20,
74
+ "B-AUX": 4,
75
+ "B-CCONJ": 45,
76
+ "B-DET": 24,
77
+ "B-INTJ": 28,
78
+ "B-NOUN": 8,
79
+ "B-NUM": 30,
80
+ "B-PART": 26,
81
+ "B-PRON": 17,
82
+ "B-PROPN": 34,
83
+ "B-SCONJ": 44,
84
+ "B-SYM": 35,
85
+ "B-VERB": 1,
86
+ "B-X": 14,
87
+ "CCONJ": 15,
88
+ "DET": 41,
89
+ "I-ADJ": 6,
90
+ "I-ADP": 7,
91
+ "I-ADV": 32,
92
+ "I-AUX": 33,
93
+ "I-CCONJ": 47,
94
+ "I-DET": 27,
95
+ "I-INTJ": 37,
96
+ "I-NOUN": 19,
97
+ "I-NUM": 23,
98
+ "I-PART": 36,
99
+ "I-PRON": 18,
100
+ "I-PROPN": 39,
101
+ "I-SCONJ": 2,
102
+ "I-SYM": 48,
103
+ "I-VERB": 31,
104
+ "I-X": 25,
105
+ "INTJ": 29,
106
+ "NOUN": 11,
107
+ "NUM": 12,
108
+ "PART": 5,
109
+ "PRON": 9,
110
+ "PROPN": 46,
111
+ "PUNCT": 13,
112
+ "SCONJ": 0,
113
+ "SYM": 42,
114
+ "VERB": 3,
115
+ "X": 38
116
  },
117
  "layer_norm_eps": 1e-12,
118
  "max_position_embeddings": 128,
 
123
  "position_embedding_type": "absolute",
124
  "tokenizer_class": "RemBertTokenizerFast",
125
  "torch_dtype": "float32",
126
+ "transformers_version": "4.11.3",
127
  "type_vocab_size": 2,
128
  "use_cache": true,
129
  "vocab_size": 250315