KoichiYasuoka committed on
Commit
e392d45
1 Parent(s): 328130f

re-initialize

Browse files
suparkanbun/models/guwenbert-base.pos/config.json ADDED
@@ -0,0 +1,291 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "ethanyt/guwenbert-base",
3
+ "architectures": [
4
+ "RobertaForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 2,
9
+ "finetuning_task": "ner",
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "n,代名詞,人称,他,PRON,Person=1|PronType=Prs",
16
+ "1": "n,代名詞,人称,他,PRON,Person=2|PronType=Prs",
17
+ "2": "n,代名詞,人称,他,PRON,Person=3|PronType=Prs",
18
+ "3": "n,代名詞,人称,他,PRON,PronType=Prs",
19
+ "4": "n,代名詞,人称,他,PRON,PronType=Prs|Reflex=Yes",
20
+ "5": "n,代名詞,人称,止格,PRON,Person=1|PronType=Prs",
21
+ "6": "n,代名詞,人称,止格,PRON,Person=2|PronType=Prs",
22
+ "7": "n,代名詞,人称,止格,PRON,Person=3|PronType=Prs",
23
+ "8": "n,代名詞,人称,止格,PRON,PronType=Prs",
24
+ "9": "n,代名詞,人称,起格,PRON,Person=1|PronType=Prs",
25
+ "10": "n,代名詞,人称,起格,PRON,Person=2|PronType=Prs",
26
+ "11": "n,代名詞,人称,起格,PRON,Person=3|PronType=Prs",
27
+ "12": "n,代名詞,人称,起格,PRON,PronType=Prs",
28
+ "13": "n,代名詞,指示,*,PRON,PronType=Dem",
29
+ "14": "n,代名詞,疑問,*,PRON,PronType=Int",
30
+ "15": "n,名詞,不可譲,属性,NOUN,_",
31
+ "16": "n,名詞,不可譲,疾病,NOUN,_",
32
+ "17": "n,名詞,不可譲,身体,NOUN,_",
33
+ "18": "n,名詞,主体,動物,NOUN,_",
34
+ "19": "n,名詞,主体,国名,PROPN,Case=Loc|NameType=Nat",
35
+ "20": "n,名詞,主体,書物,NOUN,_",
36
+ "21": "n,名詞,主体,機関,NOUN,_",
37
+ "22": "n,名詞,主体,集団,NOUN,_",
38
+ "23": "n,名詞,人,その他の人名,PROPN,NameType=Prs",
39
+ "24": "n,名詞,人,人,NOUN,_",
40
+ "25": "n,名詞,人,名,PROPN,NameType=Giv",
41
+ "26": "n,名詞,人,姓氏,PROPN,NameType=Sur",
42
+ "27": "n,名詞,人,役割,NOUN,_",
43
+ "28": "n,名詞,人,複合的人名,PROPN,NameType=Prs",
44
+ "29": "n,名詞,人,関係,NOUN,_",
45
+ "30": "n,名詞,制度,儀礼,NOUN,_",
46
+ "31": "n,名詞,制度,場,NOUN,Case=Loc",
47
+ "32": "n,名詞,可搬,乗り物,NOUN,_",
48
+ "33": "n,名詞,可搬,伝達,NOUN,_",
49
+ "34": "n,名詞,可搬,成果物,NOUN,_",
50
+ "35": "n,名詞,可搬,糧食,NOUN,_",
51
+ "36": "n,名詞,可搬,道具,NOUN,_",
52
+ "37": "n,名詞,固定物,地名,PROPN,Case=Loc|NameType=Geo",
53
+ "38": "n,名詞,固定物,地形,NOUN,Case=Loc",
54
+ "39": "n,名詞,固定物,建造物,NOUN,Case=Loc",
55
+ "40": "n,名詞,固定物,樹木,NOUN,_",
56
+ "41": "n,名詞,固定物,関係,NOUN,Case=Loc",
57
+ "42": "n,名詞,外観,人,NOUN,_",
58
+ "43": "n,名詞,天象,天文,NOUN,_",
59
+ "44": "n,名詞,天象,怪異,NOUN,_",
60
+ "45": "n,名詞,天象,気象,NOUN,_",
61
+ "46": "n,名詞,度量衡,*,NOUN,NounType=Clf",
62
+ "47": "n,名詞,思考,*,NOUN,_",
63
+ "48": "n,名詞,描写,形質,NOUN,_",
64
+ "49": "n,名詞,描写,態度,NOUN,_",
65
+ "50": "n,名詞,数量,*,NOUN,_",
66
+ "51": "n,名詞,時,*,NOUN,Case=Tem",
67
+ "52": "n,名詞,行為,*,NOUN,_",
68
+ "53": "n,数詞,干支,*,NUM,NumType=Ord",
69
+ "54": "n,数詞,数,*,NUM,_",
70
+ "55": "n,数詞,数字,*,NUM,_",
71
+ "56": "p,助詞,句末,*,PART,_",
72
+ "57": "p,助詞,句頭,*,PART,_",
73
+ "58": "p,助詞,接続,並列,CCONJ,_",
74
+ "59": "p,助詞,接続,体言化,PART,_",
75
+ "60": "p,助詞,接続,属格,SCONJ,_",
76
+ "61": "p,助詞,提示,*,PART,_",
77
+ "62": "p,感嘆詞,*,*,INTJ,_",
78
+ "63": "p,接尾辞,*,*,PART,_",
79
+ "64": "s,文字,*,*,SYM,_",
80
+ "65": "s,記号,一般,*,SYM,_",
81
+ "66": "s,記号,句点,*,PUNCT,_",
82
+ "67": "s,記号,読点,*,PUNCT,_",
83
+ "68": "v,前置詞,基盤,*,ADP,_",
84
+ "69": "v,前置詞,源泉,*,ADP,_",
85
+ "70": "v,前置詞,経由,*,ADP,_",
86
+ "71": "v,前置詞,関係,*,ADP,_",
87
+ "72": "v,副詞,判断,推定,ADV,_",
88
+ "73": "v,副詞,判断,確定,ADV,_",
89
+ "74": "v,副詞,判断,逆接,ADV,_",
90
+ "75": "v,副詞,否定,体言否定,ADV,Polarity=Neg",
91
+ "76": "v,副詞,否定,有界,ADV,Polarity=Neg",
92
+ "77": "v,副詞,否定,無界,ADV,Polarity=Neg",
93
+ "78": "v,副詞,否定,禁止,ADV,Polarity=Neg",
94
+ "79": "v,副詞,描写,*,ADV,_",
95
+ "80": "v,副詞,時相,変化,ADV,AdvType=Tim",
96
+ "81": "v,副詞,時相,完了,ADV,AdvType=Tim|Aspect=Perf",
97
+ "82": "v,副詞,時相,将来,ADV,AdvType=Tim|Tense=Fut",
98
+ "83": "v,副詞,時相,恒常,ADV,AdvType=Tim",
99
+ "84": "v,副詞,時相,現在,ADV,AdvType=Tim|Tense=Pres",
100
+ "85": "v,副詞,時相,終局,ADV,AdvType=Tim",
101
+ "86": "v,副詞,時相,継起,ADV,AdvType=Tim",
102
+ "87": "v,副詞,時相,緊接,ADV,AdvType=Tim",
103
+ "88": "v,副詞,時相,過去,ADV,AdvType=Tim|Tense=Past",
104
+ "89": "v,副詞,疑問,原因,ADV,AdvType=Cau",
105
+ "90": "v,副詞,疑問,反語,ADV,_",
106
+ "91": "v,副詞,疑問,所在,ADV,_",
107
+ "92": "v,副詞,程度,やや高度,ADV,AdvType=Deg|Degree=Cmp",
108
+ "93": "v,副詞,程度,極度,ADV,AdvType=Deg|Degree=Sup",
109
+ "94": "v,副詞,程度,軽度,ADV,AdvType=Deg|Degree=Pos",
110
+ "95": "v,副詞,範囲,共同,ADV,_",
111
+ "96": "v,副詞,範囲,総括,ADV,_",
112
+ "97": "v,副詞,範囲,限定,ADV,_",
113
+ "98": "v,副詞,頻度,偶発,ADV,_",
114
+ "99": "v,副詞,頻度,重複,ADV,_",
115
+ "100": "v,副詞,頻度,頻繁,ADV,_",
116
+ "101": "v,助動詞,受動,*,AUX,Voice=Pass",
117
+ "102": "v,助動詞,可能,*,AUX,Mood=Pot",
118
+ "103": "v,助動詞,必要,*,AUX,Mood=Nec",
119
+ "104": "v,助動詞,願望,*,AUX,Mood=Des",
120
+ "105": "v,動詞,変化,制度,VERB,_",
121
+ "106": "v,動詞,変化,性質,VERB,_",
122
+ "107": "v,動詞,変化,生物,VERB,_",
123
+ "108": "v,動詞,存在,存在,VERB,Polarity=Neg",
124
+ "109": "v,動詞,存在,存在,VERB,VerbType=Cop",
125
+ "110": "v,動詞,存在,存在,VERB,_",
126
+ "111": "v,動詞,描写,境遇,VERB,Degree=Pos",
127
+ "112": "v,動詞,描写,形質,VERB,Degree=Pos",
128
+ "113": "v,動詞,描写,態度,VERB,Degree=Pos",
129
+ "114": "v,動詞,描写,量,VERB,Degree=Pos",
130
+ "115": "v,動詞,行為,交流,VERB,_",
131
+ "116": "v,動詞,行為,伝達,VERB,_",
132
+ "117": "v,動詞,行為,使役,VERB,_",
133
+ "118": "v,動詞,行為,儀礼,VERB,_",
134
+ "119": "v,動詞,行為,分類,VERB,Degree=Equ",
135
+ "120": "v,動詞,行為,動作,VERB,_",
136
+ "121": "v,動詞,行為,姿勢,VERB,_",
137
+ "122": "v,動詞,行為,役割,VERB,_",
138
+ "123": "v,動詞,行為,得失,VERB,_",
139
+ "124": "v,動詞,行為,態度,VERB,_",
140
+ "125": "v,動詞,行為,生産,VERB,_",
141
+ "126": "v,動詞,行為,移動,VERB,_",
142
+ "127": "v,動詞,行為,設置,VERB,_",
143
+ "128": "v,動詞,行為,飲食,VERB,_"
144
+ },
145
+ "initializer_range": 0.02,
146
+ "intermediate_size": 3072,
147
+ "label2id": {
148
+ "n,代名詞,人称,他,PRON,Person=1|PronType=Prs": 0,
149
+ "n,代名詞,人称,他,PRON,Person=2|PronType=Prs": 1,
150
+ "n,代名詞,人称,他,PRON,Person=3|PronType=Prs": 2,
151
+ "n,代名詞,人称,他,PRON,PronType=Prs": 3,
152
+ "n,代名詞,人称,他,PRON,PronType=Prs|Reflex=Yes": 4,
153
+ "n,代名詞,人称,止格,PRON,Person=1|PronType=Prs": 5,
154
+ "n,代名詞,人称,止格,PRON,Person=2|PronType=Prs": 6,
155
+ "n,代名詞,人称,止格,PRON,Person=3|PronType=Prs": 7,
156
+ "n,代名詞,人称,止格,PRON,PronType=Prs": 8,
157
+ "n,代名詞,人称,起格,PRON,Person=1|PronType=Prs": 9,
158
+ "n,代名詞,人称,起格,PRON,Person=2|PronType=Prs": 10,
159
+ "n,代名詞,人称,起格,PRON,Person=3|PronType=Prs": 11,
160
+ "n,代名詞,人称,起格,PRON,PronType=Prs": 12,
161
+ "n,代名詞,指示,*,PRON,PronType=Dem": 13,
162
+ "n,代名詞,疑問,*,PRON,PronType=Int": 14,
163
+ "n,名詞,不可譲,属性,NOUN,_": 15,
164
+ "n,名詞,不可譲,疾病,NOUN,_": 16,
165
+ "n,名詞,不可譲,身体,NOUN,_": 17,
166
+ "n,名詞,主体,動物,NOUN,_": 18,
167
+ "n,名詞,主体,国名,PROPN,Case=Loc|NameType=Nat": 19,
168
+ "n,名詞,主体,書物,NOUN,_": 20,
169
+ "n,名詞,主体,機関,NOUN,_": 21,
170
+ "n,名詞,主体,集団,NOUN,_": 22,
171
+ "n,名詞,人,その他の人名,PROPN,NameType=Prs": 23,
172
+ "n,名詞,人,人,NOUN,_": 24,
173
+ "n,名詞,人,名,PROPN,NameType=Giv": 25,
174
+ "n,名詞,人,姓氏,PROPN,NameType=Sur": 26,
175
+ "n,名詞,人,役割,NOUN,_": 27,
176
+ "n,名詞,人,複合的人名,PROPN,NameType=Prs": 28,
177
+ "n,名詞,人,関係,NOUN,_": 29,
178
+ "n,名詞,制度,儀礼,NOUN,_": 30,
179
+ "n,名詞,制度,場,NOUN,Case=Loc": 31,
180
+ "n,名詞,可搬,乗り物,NOUN,_": 32,
181
+ "n,名詞,可搬,伝達,NOUN,_": 33,
182
+ "n,名詞,可搬,成果物,NOUN,_": 34,
183
+ "n,名詞,可搬,糧食,NOUN,_": 35,
184
+ "n,名詞,可搬,道具,NOUN,_": 36,
185
+ "n,名詞,固定物,地名,PROPN,Case=Loc|NameType=Geo": 37,
186
+ "n,名詞,固定物,地形,NOUN,Case=Loc": 38,
187
+ "n,名詞,固定物,建造物,NOUN,Case=Loc": 39,
188
+ "n,名詞,固定物,樹木,NOUN,_": 40,
189
+ "n,名詞,固定物,関係,NOUN,Case=Loc": 41,
190
+ "n,名詞,外観,人,NOUN,_": 42,
191
+ "n,名詞,天象,天文,NOUN,_": 43,
192
+ "n,名詞,天象,怪異,NOUN,_": 44,
193
+ "n,名詞,天象,気象,NOUN,_": 45,
194
+ "n,名詞,度量衡,*,NOUN,NounType=Clf": 46,
195
+ "n,名詞,思考,*,NOUN,_": 47,
196
+ "n,名詞,描写,形質,NOUN,_": 48,
197
+ "n,名詞,描写,態度,NOUN,_": 49,
198
+ "n,名詞,数量,*,NOUN,_": 50,
199
+ "n,名詞,時,*,NOUN,Case=Tem": 51,
200
+ "n,名詞,行為,*,NOUN,_": 52,
201
+ "n,数詞,干支,*,NUM,NumType=Ord": 53,
202
+ "n,数詞,数,*,NUM,_": 54,
203
+ "n,数詞,数字,*,NUM,_": 55,
204
+ "p,助詞,句末,*,PART,_": 56,
205
+ "p,助詞,句頭,*,PART,_": 57,
206
+ "p,助詞,接続,並列,CCONJ,_": 58,
207
+ "p,助詞,接続,体言化,PART,_": 59,
208
+ "p,助詞,接続,属格,SCONJ,_": 60,
209
+ "p,助詞,提示,*,PART,_": 61,
210
+ "p,感嘆詞,*,*,INTJ,_": 62,
211
+ "p,接尾辞,*,*,PART,_": 63,
212
+ "s,文字,*,*,SYM,_": 64,
213
+ "s,記号,一般,*,SYM,_": 65,
214
+ "s,記号,句点,*,PUNCT,_": 66,
215
+ "s,記号,読点,*,PUNCT,_": 67,
216
+ "v,前置詞,基盤,*,ADP,_": 68,
217
+ "v,前置詞,源泉,*,ADP,_": 69,
218
+ "v,前置詞,経由,*,ADP,_": 70,
219
+ "v,前置詞,関係,*,ADP,_": 71,
220
+ "v,副詞,判断,推定,ADV,_": 72,
221
+ "v,副詞,判断,確定,ADV,_": 73,
222
+ "v,副詞,判断,逆接,ADV,_": 74,
223
+ "v,副詞,否定,体言否定,ADV,Polarity=Neg": 75,
224
+ "v,副詞,否定,有界,ADV,Polarity=Neg": 76,
225
+ "v,副詞,否定,無界,ADV,Polarity=Neg": 77,
226
+ "v,副詞,否定,禁止,ADV,Polarity=Neg": 78,
227
+ "v,副詞,描写,*,ADV,_": 79,
228
+ "v,副詞,時相,変化,ADV,AdvType=Tim": 80,
229
+ "v,副詞,時相,完了,ADV,AdvType=Tim|Aspect=Perf": 81,
230
+ "v,副詞,時相,将来,ADV,AdvType=Tim|Tense=Fut": 82,
231
+ "v,副詞,時相,恒常,ADV,AdvType=Tim": 83,
232
+ "v,副詞,時相,現在,ADV,AdvType=Tim|Tense=Pres": 84,
233
+ "v,副詞,時相,終局,ADV,AdvType=Tim": 85,
234
+ "v,副詞,時相,継起,ADV,AdvType=Tim": 86,
235
+ "v,副詞,時相,緊接,ADV,AdvType=Tim": 87,
236
+ "v,副詞,時相,過去,ADV,AdvType=Tim|Tense=Past": 88,
237
+ "v,副詞,疑問,原因,ADV,AdvType=Cau": 89,
238
+ "v,副詞,疑問,反語,ADV,_": 90,
239
+ "v,副詞,疑問,所在,ADV,_": 91,
240
+ "v,副詞,程度,やや高度,ADV,AdvType=Deg|Degree=Cmp": 92,
241
+ "v,副詞,程度,極度,ADV,AdvType=Deg|Degree=Sup": 93,
242
+ "v,副詞,程度,軽度,ADV,AdvType=Deg|Degree=Pos": 94,
243
+ "v,副詞,範囲,共同,ADV,_": 95,
244
+ "v,副詞,範囲,総括,ADV,_": 96,
245
+ "v,副詞,範囲,限定,ADV,_": 97,
246
+ "v,副詞,頻度,偶発,ADV,_": 98,
247
+ "v,副詞,頻度,重複,ADV,_": 99,
248
+ "v,副詞,頻度,頻繁,ADV,_": 100,
249
+ "v,助動詞,受動,*,AUX,Voice=Pass": 101,
250
+ "v,助動詞,可能,*,AUX,Mood=Pot": 102,
251
+ "v,助動詞,必要,*,AUX,Mood=Nec": 103,
252
+ "v,助動詞,願望,*,AUX,Mood=Des": 104,
253
+ "v,動詞,変化,制度,VERB,_": 105,
254
+ "v,動詞,変化,性質,VERB,_": 106,
255
+ "v,動詞,変化,生物,VERB,_": 107,
256
+ "v,動詞,存在,存在,VERB,Polarity=Neg": 108,
257
+ "v,動詞,存在,存在,VERB,VerbType=Cop": 109,
258
+ "v,動詞,存在,存在,VERB,_": 110,
259
+ "v,動詞,描写,境遇,VERB,Degree=Pos": 111,
260
+ "v,動詞,描写,形質,VERB,Degree=Pos": 112,
261
+ "v,動詞,描写,態度,VERB,Degree=Pos": 113,
262
+ "v,動詞,描写,量,VERB,Degree=Pos": 114,
263
+ "v,動詞,行為,交流,VERB,_": 115,
264
+ "v,動詞,行為,伝達,VERB,_": 116,
265
+ "v,動詞,行為,使役,VERB,_": 117,
266
+ "v,動詞,行為,儀礼,VERB,_": 118,
267
+ "v,動詞,行為,分類,VERB,Degree=Equ": 119,
268
+ "v,動詞,行為,動作,VERB,_": 120,
269
+ "v,動詞,行為,姿勢,VERB,_": 121,
270
+ "v,動詞,行為,役割,VERB,_": 122,
271
+ "v,動詞,行為,得失,VERB,_": 123,
272
+ "v,動詞,行為,態度,VERB,_": 124,
273
+ "v,動詞,行為,生産,VERB,_": 125,
274
+ "v,動詞,行為,移動,VERB,_": 126,
275
+ "v,動詞,行為,設置,VERB,_": 127,
276
+ "v,動詞,行為,飲食,VERB,_": 128
277
+ },
278
+ "layer_norm_eps": 1e-05,
279
+ "max_position_embeddings": 514,
280
+ "model_type": "roberta",
281
+ "num_attention_heads": 12,
282
+ "num_hidden_layers": 12,
283
+ "pad_token_id": 1,
284
+ "position_embedding_type": "absolute",
285
+ "tokenizer_class": "BertTokenizer",
286
+ "torch_dtype": "float32",
287
+ "transformers_version": "4.9.2",
288
+ "type_vocab_size": 1,
289
+ "use_cache": true,
290
+ "vocab_size": 23292
291
+ }
suparkanbun/models/guwenbert-base.pos/filesize.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ pytorch_model.bin 413843728
2
+ guwenbert-base.supar 463070836
suparkanbun/models/guwenbert-base.pos/guwenbert-base.supar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0dff1df3a532e5570a80fe56cb1345bfa2c6018df1a80f351906e1ad7b2b416
3
+ size 463070836
suparkanbun/models/guwenbert-base.pos/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12f3d827a041fe44879e25031ba74bec5c6f7408b211dff0b2ebedbf8c40dace
3
+ size 413843728
suparkanbun/models/guwenbert-base.pos/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
suparkanbun/models/guwenbert-base.pos/tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-base", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
suparkanbun/models/guwenbert-base.pos/vocab.txt ADDED
The diff for this file is too large to render. See raw diff