Commit
•
7bd4e87
1
Parent(s):
b227d59
model improved
Browse files- setup.py +1 -1
- suparkanbun/models/gloss.orig.txt +12 -0
- suparkanbun/models/guwenbert-base.danku/config.json +14 -14
- suparkanbun/models/guwenbert-base.danku/filesize.txt +1 -1
- suparkanbun/models/guwenbert-base.danku/pytorch_model.bin +2 -2
- suparkanbun/models/guwenbert-base.danku/tokenizer_config.json +1 -1
- suparkanbun/models/guwenbert-base.pos/config.json +260 -260
- suparkanbun/models/guwenbert-base.pos/filesize.txt +1 -1
- suparkanbun/models/guwenbert-base.pos/guwenbert-base.supar +2 -2
- suparkanbun/models/guwenbert-base.pos/pytorch_model.bin +1 -1
- suparkanbun/models/guwenbert-base.pos/tokenizer_config.json +1 -1
- suparkanbun/models/guwenbert-large.danku/config.json +14 -14
- suparkanbun/models/guwenbert-large.danku/filesize.txt +1 -1
- suparkanbun/models/guwenbert-large.danku/pytorch_model.bin +2 -2
- suparkanbun/models/guwenbert-large.danku/tokenizer_config.json +1 -1
- suparkanbun/models/guwenbert-large.pos/config.json +260 -260
- suparkanbun/models/guwenbert-large.pos/filesize.txt +2 -2
- suparkanbun/models/guwenbert-large.pos/guwenbert-large.supar +2 -2
- suparkanbun/models/guwenbert-large.pos/pytorch_model.bin +2 -2
- suparkanbun/models/guwenbert-large.pos/tokenizer_config.json +1 -1
- suparkanbun/models/lzh_kyoto.conllu +2 -2
- suparkanbun/models/mkmodel.sh +26 -26
- suparkanbun/models/roberta-classical-chinese-base-char.danku/config.json +14 -13
- suparkanbun/models/roberta-classical-chinese-base-char.danku/filesize.txt +1 -1
- suparkanbun/models/roberta-classical-chinese-base-char.danku/pytorch_model.bin +2 -2
- suparkanbun/models/roberta-classical-chinese-base-char.danku/tokenizer_config.json +1 -1
- suparkanbun/models/roberta-classical-chinese-large-char.danku/config.json +14 -13
- suparkanbun/models/roberta-classical-chinese-large-char.danku/filesize.txt +1 -1
- suparkanbun/models/roberta-classical-chinese-large-char.danku/pytorch_model.bin +2 -2
- suparkanbun/models/roberta-classical-chinese-large-char.danku/tokenizer_config.json +1 -1
- suparkanbun/models/roberta-classical-chinese-large-char.pos/config.json +260 -259
- suparkanbun/models/roberta-classical-chinese-large-char.pos/filesize.txt +2 -2
- suparkanbun/models/roberta-classical-chinese-large-char.pos/pytorch_model.bin +2 -2
- suparkanbun/models/roberta-classical-chinese-large-char.pos/roberta-classical-chinese-large-char.supar +2 -2
- suparkanbun/models/roberta-classical-chinese-large-char.pos/tokenizer_config.json +1 -1
- suparkanbun/models/sikubert.danku/config.json +14 -13
- suparkanbun/models/sikubert.danku/filesize.txt +1 -1
- suparkanbun/models/sikubert.danku/pytorch_model.bin +2 -2
- suparkanbun/models/sikubert.pos/config.json +260 -259
- suparkanbun/models/sikubert.pos/filesize.txt +2 -2
- suparkanbun/models/sikubert.pos/pytorch_model.bin +2 -2
- suparkanbun/models/sikubert.pos/sikubert.supar +2 -2
- suparkanbun/models/sikuroberta.danku/config.json +14 -13
- suparkanbun/models/sikuroberta.danku/filesize.txt +1 -1
- suparkanbun/models/sikuroberta.danku/pytorch_model.bin +2 -2
- suparkanbun/models/sikuroberta.pos/config.json +260 -259
- suparkanbun/models/sikuroberta.pos/filesize.txt +2 -2
- suparkanbun/models/sikuroberta.pos/pytorch_model.bin +2 -2
- suparkanbun/models/sikuroberta.pos/sikuroberta.supar +2 -2
setup.py
CHANGED
@@ -5,7 +5,7 @@ URL="https://github.com/KoichiYasuoka/SuPar-Kanbun"
|
|
5 |
|
6 |
setuptools.setup(
|
7 |
name="suparkanbun",
|
8 |
-
version="1.3.
|
9 |
description="Tokenizer POS-tagger and Dependency-parser for Classical Chinese",
|
10 |
long_description=long_description,
|
11 |
long_description_content_type="text/markdown",
|
|
|
5 |
|
6 |
setuptools.setup(
|
7 |
name="suparkanbun",
|
8 |
+
version="1.3.8",
|
9 |
description="Tokenizer POS-tagger and Dependency-parser for Classical Chinese",
|
10 |
long_description=long_description,
|
11 |
long_description_content_type="text/markdown",
|
suparkanbun/models/gloss.orig.txt
CHANGED
@@ -390,6 +390,8 @@
|
|
390 |
像 像 v,動詞,行為,動作 image
|
391 |
侨 僑 侨 v,動詞,行為,動作 sojourn
|
392 |
僑 僑 侨 v,動詞,行為,動作 sojourn
|
|
|
|
|
393 |
仆 僕 仆 n,名詞,人,役割 servant
|
394 |
僕 僕 仆 n,名詞,人,役割 servant
|
395 |
仆 僕 仆 v,動詞,描写,態度 intricate
|
@@ -613,6 +615,7 @@
|
|
613 |
功 功 n,名詞,可搬,成果物 achievement
|
614 |
加 加 v,動詞,行為,得失 add
|
615 |
助 助 v,動詞,行為,交流 help
|
|
|
616 |
劫 劫 v,動詞,行為,交流 rob
|
617 |
勃 勃 v,動詞,描写,形質 sudden
|
618 |
勇 勇 n,名詞,描写,態度 bravery
|
@@ -1047,6 +1050,8 @@
|
|
1047 |
堯典 堯典 尧典 n,名詞,主体,書物 [book-name]
|
1048 |
尧典 堯典 尧典 n,名詞,主体,書物 [book-name]
|
1049 |
尭典 堯典 尧典 n,名詞,主体,書物 [book-name]
|
|
|
|
|
1050 |
報 報 报 v,動詞,行為,交流 report-back
|
1051 |
报 報 报 v,動詞,行為,交流 report-back
|
1052 |
场 場 场 n,名詞,固定物,建造物 meeting-place
|
@@ -2888,6 +2893,10 @@
|
|
2888 |
淇 淇 n,名詞,固定物,地名 [place-name]
|
2889 |
淑 淑 v,動詞,描写,態度 gentle
|
2890 |
淡 淡 v,動詞,描写,形質 thin
|
|
|
|
|
|
|
|
|
2891 |
淫 淫 n,名詞,描写,態度 licentious
|
2892 |
淫 淫 v,動詞,描写,態度 excessive
|
2893 |
深 深 v,動詞,描写,量 deep
|
@@ -3124,6 +3133,8 @@
|
|
3124 |
爽 爽 v,動詞,行為,交流 lively
|
3125 |
尔 爾 尔 n,代名詞,人称,止格 [2PRON]
|
3126 |
爾 爾 尔 n,代名詞,人称,止格 [2PRON]
|
|
|
|
|
3127 |
尔 爾 尔 p,助詞,句末,* [final-particle]
|
3128 |
爾 爾 尔 p,助詞,句末,* [final-particle]
|
3129 |
尔 爾 尔 p,接尾辞,*,* [suffix]
|
@@ -3409,6 +3420,7 @@
|
|
3409 |
目 目 v,動詞,行為,動作 look-at
|
3410 |
直 直 v,副詞,範囲,限定 only
|
3411 |
直 直 v,動詞,描写,形質 straight
|
|
|
3412 |
相 相 n,名詞,人,役割 chief-minister
|
3413 |
相 相 v,副詞,範囲,共同 each-other
|
3414 |
相 相 v,動詞,行為,交流 assist
|
|
|
390 |
像 像 v,動詞,行為,動作 image
|
391 |
侨 僑 侨 v,動詞,行為,動作 sojourn
|
392 |
僑 僑 侨 v,動詞,行為,動作 sojourn
|
393 |
+
仆 僕 仆 n,代名詞,人称,止格 [1PRON]
|
394 |
+
僕 僕 仆 n,代名詞,人称,止格 [1PRON]
|
395 |
仆 僕 仆 n,名詞,人,役割 servant
|
396 |
僕 僕 仆 n,名詞,人,役割 servant
|
397 |
仆 僕 仆 v,動詞,描写,態度 intricate
|
|
|
615 |
功 功 n,名詞,可搬,成果物 achievement
|
616 |
加 加 v,動詞,行為,得失 add
|
617 |
助 助 v,動詞,行為,交流 help
|
618 |
+
劫 劫 n,名詞,時,* kalpa
|
619 |
劫 劫 v,動詞,行為,交流 rob
|
620 |
勃 勃 v,動詞,描写,形質 sudden
|
621 |
勇 勇 n,名詞,描写,態度 bravery
|
|
|
1050 |
堯典 堯典 尧典 n,名詞,主体,書物 [book-name]
|
1051 |
尧典 堯典 尧典 n,名詞,主体,書物 [book-name]
|
1052 |
尭典 堯典 尧典 n,名詞,主体,書物 [book-name]
|
1053 |
+
報 報 报 n,名詞,可搬,成果物 retribution
|
1054 |
+
报 報 报 n,名詞,可搬,成果物 retribution
|
1055 |
報 報 报 v,動詞,行為,交流 report-back
|
1056 |
报 報 报 v,動詞,行為,交流 report-back
|
1057 |
场 場 场 n,名詞,固定物,建造物 meeting-place
|
|
|
2893 |
淇 淇 n,名詞,固定物,地名 [place-name]
|
2894 |
淑 淑 v,動詞,描写,態度 gentle
|
2895 |
淡 淡 v,動詞,描写,形質 thin
|
2896 |
+
净 淨 净 v,動詞,描写,形質 clean
|
2897 |
+
凈 淨 净 v,動詞,描写,形質 clean
|
2898 |
+
浄 淨 净 v,動詞,描写,形質 clean
|
2899 |
+
淨 淨 净 v,動詞,描写,形質 clean
|
2900 |
淫 淫 n,名詞,描写,態度 licentious
|
2901 |
淫 淫 v,動詞,描写,態度 excessive
|
2902 |
深 深 v,動詞,描写,量 deep
|
|
|
3133 |
爽 爽 v,動詞,行為,交流 lively
|
3134 |
尔 爾 尔 n,代名詞,人称,止格 [2PRON]
|
3135 |
爾 爾 尔 n,代名詞,人称,止格 [2PRON]
|
3136 |
+
尔 爾 尔 n,代名詞,指示,* this
|
3137 |
+
爾 爾 尔 n,代名詞,指示,* this
|
3138 |
尔 爾 尔 p,助詞,句末,* [final-particle]
|
3139 |
爾 爾 尔 p,助詞,句末,* [final-particle]
|
3140 |
尔 爾 尔 p,接尾辞,*,* [suffix]
|
|
|
3420 |
目 目 v,動詞,行為,動作 look-at
|
3421 |
直 直 v,副詞,範囲,限定 only
|
3422 |
直 直 v,動詞,描写,形質 straight
|
3423 |
+
相 相 n,名詞,不可譲,身体 appearlance
|
3424 |
相 相 n,名詞,人,役割 chief-minister
|
3425 |
相 相 v,副詞,範囲,共同 each-other
|
3426 |
相 相 v,動詞,行為,交流 assist
|
suparkanbun/models/guwenbert-base.danku/config.json
CHANGED
@@ -5,29 +5,29 @@
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
-
"gradient_checkpointing": false,
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
-
"0": "
|
16 |
-
"1": "
|
17 |
-
"2": "
|
18 |
-
"3": "
|
19 |
-
"4": "
|
20 |
-
"5": "
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 3072,
|
24 |
"label2id": {
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
-
"
|
31 |
},
|
32 |
"layer_norm_eps": 1e-05,
|
33 |
"max_position_embeddings": 514,
|
@@ -38,7 +38,7 @@
|
|
38 |
"position_embedding_type": "absolute",
|
39 |
"tokenizer_class": "BertTokenizer",
|
40 |
"torch_dtype": "float32",
|
41 |
-
"transformers_version": "4.
|
42 |
"type_vocab_size": 1,
|
43 |
"use_cache": true,
|
44 |
"vocab_size": 23292
|
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
"eos_token_id": 2,
|
10 |
"finetuning_task": "ner",
|
|
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
+
"0": "B",
|
16 |
+
"1": "E",
|
17 |
+
"2": "E2",
|
18 |
+
"3": "E3",
|
19 |
+
"4": "M",
|
20 |
+
"5": "S"
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 3072,
|
24 |
"label2id": {
|
25 |
+
"B": 0,
|
26 |
+
"E": 1,
|
27 |
+
"E2": 2,
|
28 |
+
"E3": 3,
|
29 |
+
"M": 4,
|
30 |
+
"S": 5
|
31 |
},
|
32 |
"layer_norm_eps": 1e-05,
|
33 |
"max_position_embeddings": 514,
|
|
|
38 |
"position_embedding_type": "absolute",
|
39 |
"tokenizer_class": "BertTokenizer",
|
40 |
"torch_dtype": "float32",
|
41 |
+
"transformers_version": "4.11.3",
|
42 |
"type_vocab_size": 1,
|
43 |
"use_cache": true,
|
44 |
"vocab_size": 23292
|
suparkanbun/models/guwenbert-base.danku/filesize.txt
CHANGED
@@ -1 +1 @@
|
|
1 |
-
pytorch_model.bin
|
|
|
1 |
+
pytorch_model.bin 413465359
|
suparkanbun/models/guwenbert-base.danku/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a0a39f0241d2b97409c36c4fe8a75c790f3f4af1db7900a3b795c2a47fb6299
|
3 |
+
size 413465359
|
suparkanbun/models/guwenbert-base.danku/tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-base", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "add_prefix_space": true, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-base", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
suparkanbun/models/guwenbert-base.pos/config.json
CHANGED
@@ -5,275 +5,275 @@
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
-
"gradient_checkpointing": false,
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
-
"0": "n
|
16 |
-
"1": "n
|
17 |
-
"2": "n
|
18 |
-
"3": "n
|
19 |
-
"4": "n
|
20 |
-
"5": "n
|
21 |
-
"6": "n
|
22 |
-
"7": "n
|
23 |
-
"8": "n
|
24 |
-
"9": "n
|
25 |
-
"10": "n
|
26 |
-
"11": "n
|
27 |
-
"12": "n
|
28 |
-
"13": "n
|
29 |
-
"14": "n
|
30 |
-
"15": "n
|
31 |
-
"16": "n
|
32 |
-
"17": "n
|
33 |
-
"18": "n
|
34 |
-
"19": "n
|
35 |
-
"20": "n
|
36 |
-
"21": "n
|
37 |
-
"22": "n
|
38 |
-
"23": "n
|
39 |
-
"24": "n
|
40 |
-
"25": "n
|
41 |
-
"26": "n
|
42 |
-
"27": "n
|
43 |
-
"28": "n
|
44 |
-
"29": "n
|
45 |
-
"30": "n
|
46 |
-
"31": "n
|
47 |
-
"32": "n
|
48 |
-
"33": "n
|
49 |
-
"34": "n
|
50 |
-
"35": "n
|
51 |
-
"36": "n
|
52 |
-
"37": "n
|
53 |
-
"38": "n
|
54 |
-
"39": "n
|
55 |
-
"40": "n
|
56 |
-
"41": "n
|
57 |
-
"42": "n
|
58 |
-
"43": "n
|
59 |
-
"44": "n
|
60 |
-
"45": "n
|
61 |
-
"46": "n
|
62 |
-
"47": "n
|
63 |
-
"48": "n
|
64 |
-
"49": "n
|
65 |
-
"50": "n
|
66 |
-
"51": "n
|
67 |
-
"52": "n
|
68 |
-
"53": "n
|
69 |
-
"54": "n
|
70 |
-
"55": "n
|
71 |
-
"56": "p
|
72 |
-
"57": "p
|
73 |
-
"58": "p
|
74 |
-
"59": "p
|
75 |
-
"60": "p
|
76 |
-
"61": "p
|
77 |
-
"62": "p
|
78 |
-
"63": "p
|
79 |
-
"64": "s
|
80 |
-
"65": "s
|
81 |
-
"66": "s
|
82 |
-
"67": "s
|
83 |
-
"68": "v
|
84 |
-
"69": "v
|
85 |
-
"70": "v
|
86 |
-
"71": "v
|
87 |
-
"72": "v
|
88 |
-
"73": "v
|
89 |
-
"74": "v
|
90 |
-
"75": "v
|
91 |
-
"76": "v
|
92 |
-
"77": "v
|
93 |
-
"78": "v
|
94 |
-
"79": "v
|
95 |
-
"80": "v
|
96 |
-
"81": "v
|
97 |
-
"82": "v
|
98 |
-
"83": "v
|
99 |
-
"84": "v
|
100 |
-
"85": "v
|
101 |
-
"86": "v
|
102 |
-
"87": "v
|
103 |
-
"88": "v
|
104 |
-
"89": "v
|
105 |
-
"90": "v
|
106 |
-
"91": "v
|
107 |
-
"92": "v
|
108 |
-
"93": "v
|
109 |
-
"94": "v
|
110 |
-
"95": "v
|
111 |
-
"96": "v
|
112 |
-
"97": "v
|
113 |
-
"98": "v
|
114 |
-
"99": "v
|
115 |
-
"100": "v
|
116 |
-
"101": "v
|
117 |
-
"102": "v
|
118 |
-
"103": "v
|
119 |
-
"104": "v
|
120 |
-
"105": "v
|
121 |
-
"106": "v
|
122 |
-
"107": "v
|
123 |
-
"108": "v
|
124 |
-
"109": "v
|
125 |
-
"110": "v
|
126 |
-
"111": "v
|
127 |
-
"112": "v
|
128 |
-
"113": "v
|
129 |
-
"114": "v
|
130 |
-
"115": "v
|
131 |
-
"116": "v
|
132 |
-
"117": "v
|
133 |
-
"118": "v
|
134 |
-
"119": "v
|
135 |
-
"120": "v
|
136 |
-
"121": "v
|
137 |
-
"122": "v
|
138 |
-
"123": "v
|
139 |
-
"124": "v
|
140 |
-
"125": "v
|
141 |
-
"126": "v
|
142 |
-
"127": "v
|
143 |
-
"128": "v
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 3072,
|
147 |
"label2id": {
|
148 |
-
"n
|
149 |
-
"n
|
150 |
-
"n
|
151 |
-
"n
|
152 |
-
"n
|
153 |
-
"n
|
154 |
-
"n
|
155 |
-
"n
|
156 |
-
"n
|
157 |
-
"n
|
158 |
-
"n
|
159 |
-
"n
|
160 |
-
"n
|
161 |
-
"n
|
162 |
-
"n
|
163 |
-
"n
|
164 |
-
"n
|
165 |
-
"n
|
166 |
-
"n
|
167 |
-
"n
|
168 |
-
"n
|
169 |
-
"n
|
170 |
-
"n
|
171 |
-
"n
|
172 |
-
"n
|
173 |
-
"n
|
174 |
-
"n
|
175 |
-
"n
|
176 |
-
"n
|
177 |
-
"n
|
178 |
-
"n
|
179 |
-
"n
|
180 |
-
"n
|
181 |
-
"n
|
182 |
-
"n
|
183 |
-
"n
|
184 |
-
"n
|
185 |
-
"n
|
186 |
-
"n
|
187 |
-
"n
|
188 |
-
"n
|
189 |
-
"n
|
190 |
-
"n
|
191 |
-
"n
|
192 |
-
"n
|
193 |
-
"n
|
194 |
-
"n
|
195 |
-
"n
|
196 |
-
"n
|
197 |
-
"n
|
198 |
-
"n
|
199 |
-
"n
|
200 |
-
"n
|
201 |
-
"n
|
202 |
-
"n
|
203 |
-
"n
|
204 |
-
"p
|
205 |
-
"p
|
206 |
-
"p
|
207 |
-
"p
|
208 |
-
"p
|
209 |
-
"p
|
210 |
-
"p
|
211 |
-
"p
|
212 |
-
"s
|
213 |
-
"s
|
214 |
-
"s
|
215 |
-
"s
|
216 |
-
"v
|
217 |
-
"v
|
218 |
-
"v
|
219 |
-
"v
|
220 |
-
"v
|
221 |
-
"v
|
222 |
-
"v
|
223 |
-
"v
|
224 |
-
"v
|
225 |
-
"v
|
226 |
-
"v
|
227 |
-
"v
|
228 |
-
"v
|
229 |
-
"v
|
230 |
-
"v
|
231 |
-
"v
|
232 |
-
"v
|
233 |
-
"v
|
234 |
-
"v
|
235 |
-
"v
|
236 |
-
"v
|
237 |
-
"v
|
238 |
-
"v
|
239 |
-
"v
|
240 |
-
"v
|
241 |
-
"v
|
242 |
-
"v
|
243 |
-
"v
|
244 |
-
"v
|
245 |
-
"v
|
246 |
-
"v
|
247 |
-
"v
|
248 |
-
"v
|
249 |
-
"v
|
250 |
-
"v
|
251 |
-
"v
|
252 |
-
"v
|
253 |
-
"v
|
254 |
-
"v
|
255 |
-
"v
|
256 |
-
"v
|
257 |
-
"v
|
258 |
-
"v
|
259 |
-
"v
|
260 |
-
"v
|
261 |
-
"v
|
262 |
-
"v
|
263 |
-
"v
|
264 |
-
"v
|
265 |
-
"v
|
266 |
-
"v
|
267 |
-
"v
|
268 |
-
"v
|
269 |
-
"v
|
270 |
-
"v
|
271 |
-
"v
|
272 |
-
"v
|
273 |
-
"v
|
274 |
-
"v
|
275 |
-
"v
|
276 |
-
"v
|
277 |
},
|
278 |
"layer_norm_eps": 1e-05,
|
279 |
"max_position_embeddings": 514,
|
@@ -284,7 +284,7 @@
|
|
284 |
"position_embedding_type": "absolute",
|
285 |
"tokenizer_class": "BertTokenizer",
|
286 |
"torch_dtype": "float32",
|
287 |
-
"transformers_version": "4.
|
288 |
"type_vocab_size": 1,
|
289 |
"use_cache": true,
|
290 |
"vocab_size": 23292
|
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
"eos_token_id": 2,
|
10 |
"finetuning_task": "ner",
|
|
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
+
"0": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs",
|
16 |
+
"1": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs",
|
17 |
+
"2": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs",
|
18 |
+
"3": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs",
|
19 |
+
"4": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes",
|
20 |
+
"5": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs",
|
21 |
+
"6": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs",
|
22 |
+
"7": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs",
|
23 |
+
"8": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs",
|
24 |
+
"9": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs",
|
25 |
+
"10": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs",
|
26 |
+
"11": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs",
|
27 |
+
"12": "n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem",
|
28 |
+
"13": "n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int",
|
29 |
+
"14": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_",
|
30 |
+
"15": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_",
|
31 |
+
"16": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_",
|
32 |
+
"17": "n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_",
|
33 |
+
"18": "n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat",
|
34 |
+
"19": "n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_",
|
35 |
+
"20": "n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_",
|
36 |
+
"21": "n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_",
|
37 |
+
"22": "n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_",
|
38 |
+
"23": "n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs",
|
39 |
+
"24": "n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_",
|
40 |
+
"25": "n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv",
|
41 |
+
"26": "n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur",
|
42 |
+
"27": "n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_",
|
43 |
+
"28": "n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs",
|
44 |
+
"29": "n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_",
|
45 |
+
"30": "n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_",
|
46 |
+
"31": "n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc",
|
47 |
+
"32": "n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_",
|
48 |
+
"33": "n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_",
|
49 |
+
"34": "n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_",
|
50 |
+
"35": "n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_",
|
51 |
+
"36": "n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_",
|
52 |
+
"37": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo",
|
53 |
+
"38": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc",
|
54 |
+
"39": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc",
|
55 |
+
"40": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_",
|
56 |
+
"41": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc",
|
57 |
+
"42": "n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_",
|
58 |
+
"43": "n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_",
|
59 |
+
"44": "n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_",
|
60 |
+
"45": "n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_",
|
61 |
+
"46": "n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf",
|
62 |
+
"47": "n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_",
|
63 |
+
"48": "n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_",
|
64 |
+
"49": "n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_",
|
65 |
+
"50": "n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_",
|
66 |
+
"51": "n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem",
|
67 |
+
"52": "n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_",
|
68 |
+
"53": "n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord",
|
69 |
+
"54": "n,\u6570\u8a5e,\u6570,*,NUM,_",
|
70 |
+
"55": "n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_",
|
71 |
+
"56": "p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_",
|
72 |
+
"57": "p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_",
|
73 |
+
"58": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_",
|
74 |
+
"59": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_",
|
75 |
+
"60": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_",
|
76 |
+
"61": "p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_",
|
77 |
+
"62": "p,\u611f\u5606\u8a5e,*,*,INTJ,_",
|
78 |
+
"63": "p,\u63a5\u5c3e\u8f9e,*,*,PART,_",
|
79 |
+
"64": "s,\u6587\u5b57,*,*,SYM,_",
|
80 |
+
"65": "s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_",
|
81 |
+
"66": "s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_",
|
82 |
+
"67": "s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_",
|
83 |
+
"68": "v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_",
|
84 |
+
"69": "v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_",
|
85 |
+
"70": "v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_",
|
86 |
+
"71": "v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_",
|
87 |
+
"72": "v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_",
|
88 |
+
"73": "v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_",
|
89 |
+
"74": "v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_",
|
90 |
+
"75": "v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg",
|
91 |
+
"76": "v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg",
|
92 |
+
"77": "v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg",
|
93 |
+
"78": "v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg",
|
94 |
+
"79": "v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_",
|
95 |
+
"80": "v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim",
|
96 |
+
"81": "v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf",
|
97 |
+
"82": "v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut",
|
98 |
+
"83": "v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim",
|
99 |
+
"84": "v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres",
|
100 |
+
"85": "v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim",
|
101 |
+
"86": "v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim",
|
102 |
+
"87": "v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim",
|
103 |
+
"88": "v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past",
|
104 |
+
"89": "v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau",
|
105 |
+
"90": "v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_",
|
106 |
+
"91": "v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_",
|
107 |
+
"92": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp",
|
108 |
+
"93": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup",
|
109 |
+
"94": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos",
|
110 |
+
"95": "v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_",
|
111 |
+
"96": "v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_",
|
112 |
+
"97": "v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_",
|
113 |
+
"98": "v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_",
|
114 |
+
"99": "v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_",
|
115 |
+
"100": "v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_",
|
116 |
+
"101": "v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass",
|
117 |
+
"102": "v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot",
|
118 |
+
"103": "v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec",
|
119 |
+
"104": "v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des",
|
120 |
+
"105": "v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_",
|
121 |
+
"106": "v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_",
|
122 |
+
"107": "v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_",
|
123 |
+
"108": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg",
|
124 |
+
"109": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop",
|
125 |
+
"110": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_",
|
126 |
+
"111": "v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos",
|
127 |
+
"112": "v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos",
|
128 |
+
"113": "v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos",
|
129 |
+
"114": "v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos",
|
130 |
+
"115": "v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_",
|
131 |
+
"116": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_",
|
132 |
+
"117": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_",
|
133 |
+
"118": "v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_",
|
134 |
+
"119": "v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ",
|
135 |
+
"120": "v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_",
|
136 |
+
"121": "v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_",
|
137 |
+
"122": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_",
|
138 |
+
"123": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_",
|
139 |
+
"124": "v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_",
|
140 |
+
"125": "v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_",
|
141 |
+
"126": "v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_",
|
142 |
+
"127": "v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_",
|
143 |
+
"128": "v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_"
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 3072,
|
147 |
"label2id": {
|
148 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs": 0,
|
149 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs": 1,
|
150 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs": 2,
|
151 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs": 3,
|
152 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes": 4,
|
153 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs": 5,
|
154 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs": 6,
|
155 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs": 7,
|
156 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs": 8,
|
157 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs": 9,
|
158 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs": 10,
|
159 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs": 11,
|
160 |
+
"n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem": 12,
|
161 |
+
"n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int": 13,
|
162 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_": 14,
|
163 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_": 15,
|
164 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_": 16,
|
165 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_": 17,
|
166 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat": 18,
|
167 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_": 19,
|
168 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_": 20,
|
169 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_": 21,
|
170 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_": 22,
|
171 |
+
"n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs": 23,
|
172 |
+
"n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_": 24,
|
173 |
+
"n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv": 25,
|
174 |
+
"n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur": 26,
|
175 |
+
"n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_": 27,
|
176 |
+
"n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs": 28,
|
177 |
+
"n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_": 29,
|
178 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_": 30,
|
179 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc": 31,
|
180 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_": 32,
|
181 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_": 33,
|
182 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_": 34,
|
183 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_": 35,
|
184 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_": 36,
|
185 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo": 37,
|
186 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc": 38,
|
187 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc": 39,
|
188 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_": 40,
|
189 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc": 41,
|
190 |
+
"n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_": 42,
|
191 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_": 43,
|
192 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_": 44,
|
193 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_": 45,
|
194 |
+
"n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf": 46,
|
195 |
+
"n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_": 47,
|
196 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_": 48,
|
197 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_": 49,
|
198 |
+
"n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_": 50,
|
199 |
+
"n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem": 51,
|
200 |
+
"n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_": 52,
|
201 |
+
"n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord": 53,
|
202 |
+
"n,\u6570\u8a5e,\u6570,*,NUM,_": 54,
|
203 |
+
"n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_": 55,
|
204 |
+
"p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_": 56,
|
205 |
+
"p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_": 57,
|
206 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_": 58,
|
207 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_": 59,
|
208 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_": 60,
|
209 |
+
"p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_": 61,
|
210 |
+
"p,\u611f\u5606\u8a5e,*,*,INTJ,_": 62,
|
211 |
+
"p,\u63a5\u5c3e\u8f9e,*,*,PART,_": 63,
|
212 |
+
"s,\u6587\u5b57,*,*,SYM,_": 64,
|
213 |
+
"s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_": 65,
|
214 |
+
"s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_": 66,
|
215 |
+
"s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_": 67,
|
216 |
+
"v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_": 68,
|
217 |
+
"v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_": 69,
|
218 |
+
"v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_": 70,
|
219 |
+
"v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_": 71,
|
220 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_": 72,
|
221 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_": 73,
|
222 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_": 74,
|
223 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg": 75,
|
224 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg": 76,
|
225 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg": 77,
|
226 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg": 78,
|
227 |
+
"v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_": 79,
|
228 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim": 80,
|
229 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf": 81,
|
230 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut": 82,
|
231 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim": 83,
|
232 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres": 84,
|
233 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim": 85,
|
234 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim": 86,
|
235 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim": 87,
|
236 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past": 88,
|
237 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau": 89,
|
238 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_": 90,
|
239 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_": 91,
|
240 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp": 92,
|
241 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup": 93,
|
242 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos": 94,
|
243 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_": 95,
|
244 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_": 96,
|
245 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_": 97,
|
246 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_": 98,
|
247 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_": 99,
|
248 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_": 100,
|
249 |
+
"v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass": 101,
|
250 |
+
"v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot": 102,
|
251 |
+
"v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec": 103,
|
252 |
+
"v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des": 104,
|
253 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_": 105,
|
254 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_": 106,
|
255 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_": 107,
|
256 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg": 108,
|
257 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop": 109,
|
258 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_": 110,
|
259 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos": 111,
|
260 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos": 112,
|
261 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos": 113,
|
262 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos": 114,
|
263 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_": 115,
|
264 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_": 116,
|
265 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_": 117,
|
266 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_": 118,
|
267 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ": 119,
|
268 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_": 120,
|
269 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_": 121,
|
270 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_": 122,
|
271 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_": 123,
|
272 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_": 124,
|
273 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_": 125,
|
274 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_": 126,
|
275 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_": 127,
|
276 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_": 128
|
277 |
},
|
278 |
"layer_norm_eps": 1e-05,
|
279 |
"max_position_embeddings": 514,
|
|
|
284 |
"position_embedding_type": "absolute",
|
285 |
"tokenizer_class": "BertTokenizer",
|
286 |
"torch_dtype": "float32",
|
287 |
+
"transformers_version": "4.11.3",
|
288 |
"type_vocab_size": 1,
|
289 |
"use_cache": true,
|
290 |
"vocab_size": 23292
|
suparkanbun/models/guwenbert-base.pos/filesize.txt
CHANGED
@@ -1,2 +1,2 @@
|
|
1 |
pytorch_model.bin 413843728
|
2 |
-
guwenbert-base.supar
|
|
|
1 |
pytorch_model.bin 413843728
|
2 |
+
guwenbert-base.supar 463146853
|
suparkanbun/models/guwenbert-base.pos/guwenbert-base.supar
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4329e50810946da48573aff14d9985979145d92b160040195399311fd519ccd9
|
3 |
+
size 463146853
|
suparkanbun/models/guwenbert-base.pos/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 413843728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35f764f15e5183760b4e36563ea37e28ceafcdf8cfe1827c56195533941ef426
|
3 |
size 413843728
|
suparkanbun/models/guwenbert-base.pos/tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-base", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "add_prefix_space": true, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-base", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
suparkanbun/models/guwenbert-large.danku/config.json
CHANGED
@@ -5,29 +5,29 @@
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
-
"gradient_checkpointing": false,
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 1024,
|
14 |
"id2label": {
|
15 |
-
"0": "
|
16 |
-
"1": "
|
17 |
-
"2": "
|
18 |
-
"3": "
|
19 |
-
"4": "
|
20 |
-
"5": "
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 4096,
|
24 |
"label2id": {
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
-
"
|
31 |
},
|
32 |
"layer_norm_eps": 1e-05,
|
33 |
"max_position_embeddings": 514,
|
@@ -38,7 +38,7 @@
|
|
38 |
"position_embedding_type": "absolute",
|
39 |
"tokenizer_class": "BertTokenizer",
|
40 |
"torch_dtype": "float32",
|
41 |
-
"transformers_version": "4.
|
42 |
"type_vocab_size": 1,
|
43 |
"use_cache": true,
|
44 |
"vocab_size": 23292
|
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
"eos_token_id": 2,
|
10 |
"finetuning_task": "ner",
|
|
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 1024,
|
14 |
"id2label": {
|
15 |
+
"0": "B",
|
16 |
+
"1": "E",
|
17 |
+
"2": "E2",
|
18 |
+
"3": "E3",
|
19 |
+
"4": "M",
|
20 |
+
"5": "S"
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 4096,
|
24 |
"label2id": {
|
25 |
+
"B": 0,
|
26 |
+
"E": 1,
|
27 |
+
"E2": 2,
|
28 |
+
"E3": 3,
|
29 |
+
"M": 4,
|
30 |
+
"S": 5
|
31 |
},
|
32 |
"layer_norm_eps": 1e-05,
|
33 |
"max_position_embeddings": 514,
|
|
|
38 |
"position_embedding_type": "absolute",
|
39 |
"tokenizer_class": "BertTokenizer",
|
40 |
"torch_dtype": "float32",
|
41 |
+
"transformers_version": "4.11.3",
|
42 |
"type_vocab_size": 1,
|
43 |
"use_cache": true,
|
44 |
"vocab_size": 23292
|
suparkanbun/models/guwenbert-large.danku/filesize.txt
CHANGED
@@ -1 +1 @@
|
|
1 |
-
pytorch_model.bin
|
|
|
1 |
+
pytorch_model.bin 1306952530
|
suparkanbun/models/guwenbert-large.danku/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95d01a28f549a42276365e842108af2fe173096e05e33bb9da96f89ee6d4aff6
|
3 |
+
size 1306952530
|
suparkanbun/models/guwenbert-large.danku/tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-large", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "add_prefix_space": true, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-large", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
suparkanbun/models/guwenbert-large.pos/config.json
CHANGED
@@ -5,275 +5,275 @@
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
-
"gradient_checkpointing": false,
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 1024,
|
14 |
"id2label": {
|
15 |
-
"0": "n
|
16 |
-
"1": "n
|
17 |
-
"2": "n
|
18 |
-
"3": "n
|
19 |
-
"4": "n
|
20 |
-
"5": "n
|
21 |
-
"6": "n
|
22 |
-
"7": "n
|
23 |
-
"8": "n
|
24 |
-
"9": "n
|
25 |
-
"10": "n
|
26 |
-
"11": "n
|
27 |
-
"12": "n
|
28 |
-
"13": "n
|
29 |
-
"14": "n
|
30 |
-
"15": "n
|
31 |
-
"16": "n
|
32 |
-
"17": "n
|
33 |
-
"18": "n
|
34 |
-
"19": "n
|
35 |
-
"20": "n
|
36 |
-
"21": "n
|
37 |
-
"22": "n
|
38 |
-
"23": "n
|
39 |
-
"24": "n
|
40 |
-
"25": "n
|
41 |
-
"26": "n
|
42 |
-
"27": "n
|
43 |
-
"28": "n
|
44 |
-
"29": "n
|
45 |
-
"30": "n
|
46 |
-
"31": "n
|
47 |
-
"32": "n
|
48 |
-
"33": "n
|
49 |
-
"34": "n
|
50 |
-
"35": "n
|
51 |
-
"36": "n
|
52 |
-
"37": "n
|
53 |
-
"38": "n
|
54 |
-
"39": "n
|
55 |
-
"40": "n
|
56 |
-
"41": "n
|
57 |
-
"42": "n
|
58 |
-
"43": "n
|
59 |
-
"44": "n
|
60 |
-
"45": "n
|
61 |
-
"46": "n
|
62 |
-
"47": "n
|
63 |
-
"48": "n
|
64 |
-
"49": "n
|
65 |
-
"50": "n
|
66 |
-
"51": "n
|
67 |
-
"52": "n
|
68 |
-
"53": "n
|
69 |
-
"54": "n
|
70 |
-
"55": "n
|
71 |
-
"56": "p
|
72 |
-
"57": "p
|
73 |
-
"58": "p
|
74 |
-
"59": "p
|
75 |
-
"60": "p
|
76 |
-
"61": "p
|
77 |
-
"62": "p
|
78 |
-
"63": "p
|
79 |
-
"64": "s
|
80 |
-
"65": "s
|
81 |
-
"66": "s
|
82 |
-
"67": "s
|
83 |
-
"68": "v
|
84 |
-
"69": "v
|
85 |
-
"70": "v
|
86 |
-
"71": "v
|
87 |
-
"72": "v
|
88 |
-
"73": "v
|
89 |
-
"74": "v
|
90 |
-
"75": "v
|
91 |
-
"76": "v
|
92 |
-
"77": "v
|
93 |
-
"78": "v
|
94 |
-
"79": "v
|
95 |
-
"80": "v
|
96 |
-
"81": "v
|
97 |
-
"82": "v
|
98 |
-
"83": "v
|
99 |
-
"84": "v
|
100 |
-
"85": "v
|
101 |
-
"86": "v
|
102 |
-
"87": "v
|
103 |
-
"88": "v
|
104 |
-
"89": "v
|
105 |
-
"90": "v
|
106 |
-
"91": "v
|
107 |
-
"92": "v
|
108 |
-
"93": "v
|
109 |
-
"94": "v
|
110 |
-
"95": "v
|
111 |
-
"96": "v
|
112 |
-
"97": "v
|
113 |
-
"98": "v
|
114 |
-
"99": "v
|
115 |
-
"100": "v
|
116 |
-
"101": "v
|
117 |
-
"102": "v
|
118 |
-
"103": "v
|
119 |
-
"104": "v
|
120 |
-
"105": "v
|
121 |
-
"106": "v
|
122 |
-
"107": "v
|
123 |
-
"108": "v
|
124 |
-
"109": "v
|
125 |
-
"110": "v
|
126 |
-
"111": "v
|
127 |
-
"112": "v
|
128 |
-
"113": "v
|
129 |
-
"114": "v
|
130 |
-
"115": "v
|
131 |
-
"116": "v
|
132 |
-
"117": "v
|
133 |
-
"118": "v
|
134 |
-
"119": "v
|
135 |
-
"120": "v
|
136 |
-
"121": "v
|
137 |
-
"122": "v
|
138 |
-
"123": "v
|
139 |
-
"124": "v
|
140 |
-
"125": "v
|
141 |
-
"126": "v
|
142 |
-
"127": "v
|
143 |
-
"128": "v
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 4096,
|
147 |
"label2id": {
|
148 |
-
"n
|
149 |
-
"n
|
150 |
-
"n
|
151 |
-
"n
|
152 |
-
"n
|
153 |
-
"n
|
154 |
-
"n
|
155 |
-
"n
|
156 |
-
"n
|
157 |
-
"n
|
158 |
-
"n
|
159 |
-
"n
|
160 |
-
"n
|
161 |
-
"n
|
162 |
-
"n
|
163 |
-
"n
|
164 |
-
"n
|
165 |
-
"n
|
166 |
-
"n
|
167 |
-
"n
|
168 |
-
"n
|
169 |
-
"n
|
170 |
-
"n
|
171 |
-
"n
|
172 |
-
"n
|
173 |
-
"n
|
174 |
-
"n
|
175 |
-
"n
|
176 |
-
"n
|
177 |
-
"n
|
178 |
-
"n
|
179 |
-
"n
|
180 |
-
"n
|
181 |
-
"n
|
182 |
-
"n
|
183 |
-
"n
|
184 |
-
"n
|
185 |
-
"n
|
186 |
-
"n
|
187 |
-
"n
|
188 |
-
"n
|
189 |
-
"n
|
190 |
-
"n
|
191 |
-
"n
|
192 |
-
"n
|
193 |
-
"n
|
194 |
-
"n
|
195 |
-
"n
|
196 |
-
"n
|
197 |
-
"n
|
198 |
-
"n
|
199 |
-
"n
|
200 |
-
"n
|
201 |
-
"n
|
202 |
-
"n
|
203 |
-
"n
|
204 |
-
"p
|
205 |
-
"p
|
206 |
-
"p
|
207 |
-
"p
|
208 |
-
"p
|
209 |
-
"p
|
210 |
-
"p
|
211 |
-
"p
|
212 |
-
"s
|
213 |
-
"s
|
214 |
-
"s
|
215 |
-
"s
|
216 |
-
"v
|
217 |
-
"v
|
218 |
-
"v
|
219 |
-
"v
|
220 |
-
"v
|
221 |
-
"v
|
222 |
-
"v
|
223 |
-
"v
|
224 |
-
"v
|
225 |
-
"v
|
226 |
-
"v
|
227 |
-
"v
|
228 |
-
"v
|
229 |
-
"v
|
230 |
-
"v
|
231 |
-
"v
|
232 |
-
"v
|
233 |
-
"v
|
234 |
-
"v
|
235 |
-
"v
|
236 |
-
"v
|
237 |
-
"v
|
238 |
-
"v
|
239 |
-
"v
|
240 |
-
"v
|
241 |
-
"v
|
242 |
-
"v
|
243 |
-
"v
|
244 |
-
"v
|
245 |
-
"v
|
246 |
-
"v
|
247 |
-
"v
|
248 |
-
"v
|
249 |
-
"v
|
250 |
-
"v
|
251 |
-
"v
|
252 |
-
"v
|
253 |
-
"v
|
254 |
-
"v
|
255 |
-
"v
|
256 |
-
"v
|
257 |
-
"v
|
258 |
-
"v
|
259 |
-
"v
|
260 |
-
"v
|
261 |
-
"v
|
262 |
-
"v
|
263 |
-
"v
|
264 |
-
"v
|
265 |
-
"v
|
266 |
-
"v
|
267 |
-
"v
|
268 |
-
"v
|
269 |
-
"v
|
270 |
-
"v
|
271 |
-
"v
|
272 |
-
"v
|
273 |
-
"v
|
274 |
-
"v
|
275 |
-
"v
|
276 |
-
"v
|
277 |
},
|
278 |
"layer_norm_eps": 1e-05,
|
279 |
"max_position_embeddings": 514,
|
@@ -284,7 +284,7 @@
|
|
284 |
"position_embedding_type": "absolute",
|
285 |
"tokenizer_class": "BertTokenizer",
|
286 |
"torch_dtype": "float32",
|
287 |
-
"transformers_version": "4.
|
288 |
"type_vocab_size": 1,
|
289 |
"use_cache": true,
|
290 |
"vocab_size": 23292
|
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
"eos_token_id": 2,
|
10 |
"finetuning_task": "ner",
|
|
|
11 |
"hidden_act": "gelu",
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 1024,
|
14 |
"id2label": {
|
15 |
+
"0": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs",
|
16 |
+
"1": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs",
|
17 |
+
"2": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs",
|
18 |
+
"3": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs",
|
19 |
+
"4": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes",
|
20 |
+
"5": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs",
|
21 |
+
"6": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs",
|
22 |
+
"7": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs",
|
23 |
+
"8": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs",
|
24 |
+
"9": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs",
|
25 |
+
"10": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs",
|
26 |
+
"11": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs",
|
27 |
+
"12": "n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem",
|
28 |
+
"13": "n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int",
|
29 |
+
"14": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_",
|
30 |
+
"15": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_",
|
31 |
+
"16": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_",
|
32 |
+
"17": "n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_",
|
33 |
+
"18": "n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat",
|
34 |
+
"19": "n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_",
|
35 |
+
"20": "n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_",
|
36 |
+
"21": "n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_",
|
37 |
+
"22": "n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_",
|
38 |
+
"23": "n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs",
|
39 |
+
"24": "n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_",
|
40 |
+
"25": "n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv",
|
41 |
+
"26": "n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur",
|
42 |
+
"27": "n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_",
|
43 |
+
"28": "n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs",
|
44 |
+
"29": "n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_",
|
45 |
+
"30": "n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_",
|
46 |
+
"31": "n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc",
|
47 |
+
"32": "n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_",
|
48 |
+
"33": "n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_",
|
49 |
+
"34": "n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_",
|
50 |
+
"35": "n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_",
|
51 |
+
"36": "n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_",
|
52 |
+
"37": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo",
|
53 |
+
"38": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc",
|
54 |
+
"39": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc",
|
55 |
+
"40": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_",
|
56 |
+
"41": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc",
|
57 |
+
"42": "n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_",
|
58 |
+
"43": "n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_",
|
59 |
+
"44": "n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_",
|
60 |
+
"45": "n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_",
|
61 |
+
"46": "n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf",
|
62 |
+
"47": "n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_",
|
63 |
+
"48": "n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_",
|
64 |
+
"49": "n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_",
|
65 |
+
"50": "n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_",
|
66 |
+
"51": "n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem",
|
67 |
+
"52": "n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_",
|
68 |
+
"53": "n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord",
|
69 |
+
"54": "n,\u6570\u8a5e,\u6570,*,NUM,_",
|
70 |
+
"55": "n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_",
|
71 |
+
"56": "p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_",
|
72 |
+
"57": "p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_",
|
73 |
+
"58": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_",
|
74 |
+
"59": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_",
|
75 |
+
"60": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_",
|
76 |
+
"61": "p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_",
|
77 |
+
"62": "p,\u611f\u5606\u8a5e,*,*,INTJ,_",
|
78 |
+
"63": "p,\u63a5\u5c3e\u8f9e,*,*,PART,_",
|
79 |
+
"64": "s,\u6587\u5b57,*,*,SYM,_",
|
80 |
+
"65": "s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_",
|
81 |
+
"66": "s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_",
|
82 |
+
"67": "s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_",
|
83 |
+
"68": "v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_",
|
84 |
+
"69": "v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_",
|
85 |
+
"70": "v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_",
|
86 |
+
"71": "v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_",
|
87 |
+
"72": "v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_",
|
88 |
+
"73": "v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_",
|
89 |
+
"74": "v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_",
|
90 |
+
"75": "v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg",
|
91 |
+
"76": "v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg",
|
92 |
+
"77": "v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg",
|
93 |
+
"78": "v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg",
|
94 |
+
"79": "v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_",
|
95 |
+
"80": "v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim",
|
96 |
+
"81": "v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf",
|
97 |
+
"82": "v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut",
|
98 |
+
"83": "v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim",
|
99 |
+
"84": "v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres",
|
100 |
+
"85": "v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim",
|
101 |
+
"86": "v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim",
|
102 |
+
"87": "v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim",
|
103 |
+
"88": "v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past",
|
104 |
+
"89": "v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau",
|
105 |
+
"90": "v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_",
|
106 |
+
"91": "v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_",
|
107 |
+
"92": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp",
|
108 |
+
"93": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup",
|
109 |
+
"94": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos",
|
110 |
+
"95": "v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_",
|
111 |
+
"96": "v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_",
|
112 |
+
"97": "v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_",
|
113 |
+
"98": "v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_",
|
114 |
+
"99": "v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_",
|
115 |
+
"100": "v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_",
|
116 |
+
"101": "v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass",
|
117 |
+
"102": "v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot",
|
118 |
+
"103": "v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec",
|
119 |
+
"104": "v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des",
|
120 |
+
"105": "v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_",
|
121 |
+
"106": "v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_",
|
122 |
+
"107": "v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_",
|
123 |
+
"108": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg",
|
124 |
+
"109": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop",
|
125 |
+
"110": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_",
|
126 |
+
"111": "v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos",
|
127 |
+
"112": "v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos",
|
128 |
+
"113": "v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos",
|
129 |
+
"114": "v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos",
|
130 |
+
"115": "v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_",
|
131 |
+
"116": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_",
|
132 |
+
"117": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_",
|
133 |
+
"118": "v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_",
|
134 |
+
"119": "v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ",
|
135 |
+
"120": "v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_",
|
136 |
+
"121": "v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_",
|
137 |
+
"122": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_",
|
138 |
+
"123": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_",
|
139 |
+
"124": "v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_",
|
140 |
+
"125": "v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_",
|
141 |
+
"126": "v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_",
|
142 |
+
"127": "v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_",
|
143 |
+
"128": "v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_"
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 4096,
|
147 |
"label2id": {
|
148 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs": 0,
|
149 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs": 1,
|
150 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs": 2,
|
151 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs": 3,
|
152 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes": 4,
|
153 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs": 5,
|
154 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs": 6,
|
155 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs": 7,
|
156 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs": 8,
|
157 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs": 9,
|
158 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs": 10,
|
159 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs": 11,
|
160 |
+
"n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem": 12,
|
161 |
+
"n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int": 13,
|
162 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_": 14,
|
163 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_": 15,
|
164 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_": 16,
|
165 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_": 17,
|
166 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat": 18,
|
167 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_": 19,
|
168 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_": 20,
|
169 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_": 21,
|
170 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_": 22,
|
171 |
+
"n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs": 23,
|
172 |
+
"n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_": 24,
|
173 |
+
"n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv": 25,
|
174 |
+
"n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur": 26,
|
175 |
+
"n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_": 27,
|
176 |
+
"n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs": 28,
|
177 |
+
"n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_": 29,
|
178 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_": 30,
|
179 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc": 31,
|
180 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_": 32,
|
181 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_": 33,
|
182 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_": 34,
|
183 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_": 35,
|
184 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_": 36,
|
185 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo": 37,
|
186 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc": 38,
|
187 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc": 39,
|
188 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_": 40,
|
189 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc": 41,
|
190 |
+
"n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_": 42,
|
191 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_": 43,
|
192 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_": 44,
|
193 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_": 45,
|
194 |
+
"n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf": 46,
|
195 |
+
"n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_": 47,
|
196 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_": 48,
|
197 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_": 49,
|
198 |
+
"n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_": 50,
|
199 |
+
"n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem": 51,
|
200 |
+
"n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_": 52,
|
201 |
+
"n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord": 53,
|
202 |
+
"n,\u6570\u8a5e,\u6570,*,NUM,_": 54,
|
203 |
+
"n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_": 55,
|
204 |
+
"p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_": 56,
|
205 |
+
"p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_": 57,
|
206 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_": 58,
|
207 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_": 59,
|
208 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_": 60,
|
209 |
+
"p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_": 61,
|
210 |
+
"p,\u611f\u5606\u8a5e,*,*,INTJ,_": 62,
|
211 |
+
"p,\u63a5\u5c3e\u8f9e,*,*,PART,_": 63,
|
212 |
+
"s,\u6587\u5b57,*,*,SYM,_": 64,
|
213 |
+
"s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_": 65,
|
214 |
+
"s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_": 66,
|
215 |
+
"s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_": 67,
|
216 |
+
"v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_": 68,
|
217 |
+
"v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_": 69,
|
218 |
+
"v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_": 70,
|
219 |
+
"v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_": 71,
|
220 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_": 72,
|
221 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_": 73,
|
222 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_": 74,
|
223 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg": 75,
|
224 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg": 76,
|
225 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg": 77,
|
226 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg": 78,
|
227 |
+
"v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_": 79,
|
228 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim": 80,
|
229 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf": 81,
|
230 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut": 82,
|
231 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim": 83,
|
232 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres": 84,
|
233 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim": 85,
|
234 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim": 86,
|
235 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim": 87,
|
236 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past": 88,
|
237 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau": 89,
|
238 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_": 90,
|
239 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_": 91,
|
240 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp": 92,
|
241 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup": 93,
|
242 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos": 94,
|
243 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_": 95,
|
244 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_": 96,
|
245 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_": 97,
|
246 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_": 98,
|
247 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_": 99,
|
248 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_": 100,
|
249 |
+
"v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass": 101,
|
250 |
+
"v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot": 102,
|
251 |
+
"v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec": 103,
|
252 |
+
"v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des": 104,
|
253 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_": 105,
|
254 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_": 106,
|
255 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_": 107,
|
256 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg": 108,
|
257 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop": 109,
|
258 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_": 110,
|
259 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos": 111,
|
260 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos": 112,
|
261 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos": 113,
|
262 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos": 114,
|
263 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_": 115,
|
264 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_": 116,
|
265 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_": 117,
|
266 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_": 118,
|
267 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ": 119,
|
268 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_": 120,
|
269 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_": 121,
|
270 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_": 122,
|
271 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_": 123,
|
272 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_": 124,
|
273 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_": 125,
|
274 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_": 126,
|
275 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_": 127,
|
276 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_": 128
|
277 |
},
|
278 |
"layer_norm_eps": 1e-05,
|
279 |
"max_position_embeddings": 514,
|
|
|
284 |
"position_embedding_type": "absolute",
|
285 |
"tokenizer_class": "BertTokenizer",
|
286 |
"torch_dtype": "float32",
|
287 |
+
"transformers_version": "4.11.3",
|
288 |
"type_vocab_size": 1,
|
289 |
"use_cache": true,
|
290 |
"vocab_size": 23292
|
suparkanbun/models/guwenbert-large.pos/filesize.txt
CHANGED
@@ -1,2 +1,2 @@
|
|
1 |
-
pytorch_model.bin
|
2 |
-
guwenbert-large.supar
|
|
|
1 |
+
pytorch_model.bin 1307456848
|
2 |
+
guwenbert-large.supar 1358552571
|
suparkanbun/models/guwenbert-large.pos/guwenbert-large.supar
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:482a135799b79f43a266a9e16df04852840be433bd23058ce7756a0c7e79cd1a
|
3 |
+
size 1358552571
|
suparkanbun/models/guwenbert-large.pos/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc0d5760a0cc8b9832e4555be3292af45d964938321c71ca684c4942f569d1a1
|
3 |
+
size 1307456848
|
suparkanbun/models/guwenbert-large.pos/tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-large", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "add_prefix_space": true, "special_tokens_map_file": null, "name_or_path": "ethanyt/guwenbert-large", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}
|
suparkanbun/models/lzh_kyoto.conllu
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96b0cb456a53f665127e5abc54e5addf87d6d2f78ae2b60f86bffca3f1e1e361
|
3 |
+
size 27347302
|
suparkanbun/models/mkmodel.sh
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
#! /bin/sh
|
2 |
-
# pip3 install transformers seqeval datasets supar
|
3 |
-
test -f run_ner.py || curl -LO https://raw.githubusercontent.com/huggingface/transformers/
|
4 |
|
5 |
python3 -c '
|
6 |
from suparkanbun.simplify import simplify
|
@@ -73,13 +73,13 @@ while True:
|
|
73 |
printf("%s\n",$0)>"validPOS.json";
|
74 |
}'
|
75 |
sed 's/^.*"tags":\[//' trainPOS.json | tr '"' '\012' | sort -u | egrep '^[nvps],' > labelPOS.txt
|
76 |
-
if [ ! -
|
77 |
then mkdir -p guwenbert-base.pos
|
78 |
-
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-base --train_file trainPOS.json --validation_file validPOS.json --output_dir guwenbert-base.pos --do_train --do_eval
|
79 |
fi
|
80 |
-
if [ ! -
|
81 |
then mkdir -p guwenbert-large.pos
|
82 |
-
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-large --train_file trainPOS.json --validation_file validPOS.json --output_dir guwenbert-large.pos --do_train --do_eval
|
83 |
fi
|
84 |
|
85 |
nawk '
|
@@ -139,13 +139,13 @@ while True:
|
|
139 |
printf("%s\n",$0)>"validDanku.json";
|
140 |
}'
|
141 |
sed 's/^.*"tags":\[//' trainDanku.json | tr '"' '\012' | sort -u | egrep '^[A-Z]' > labelDanku.txt
|
142 |
-
if [ ! -
|
143 |
then mkdir -p guwenbert-base.danku
|
144 |
-
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-base --train_file trainDanku.json --validation_file validDanku.json --output_dir guwenbert-base.danku --do_train --do_eval
|
145 |
fi
|
146 |
-
if [ ! -
|
147 |
then mkdir -p guwenbert-large.danku
|
148 |
-
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-large --train_file trainDanku.json --validation_file validDanku.json --output_dir guwenbert-large.danku --do_train --do_eval
|
149 |
fi
|
150 |
|
151 |
python3 -c '
|
@@ -213,13 +213,13 @@ while True:
|
|
213 |
else
|
214 |
printf("%s\n",$0)>>"validPOS.json";
|
215 |
}'
|
216 |
-
if [ ! -
|
217 |
then mkdir -p roberta-classical-chinese-base-char.pos
|
218 |
-
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-base-char --train_file trainPOS.json --validation_file validPOS.json --output_dir roberta-classical-chinese-base-char.pos --do_train --do_eval
|
219 |
fi
|
220 |
-
if [ ! -
|
221 |
then mkdir -p roberta-classical-chinese-large-char.pos
|
222 |
-
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-large-char --train_file trainPOS.json --validation_file validPOS.json --output_dir roberta-classical-chinese-large-char.pos --do_train --do_eval
|
223 |
fi
|
224 |
|
225 |
nawk '
|
@@ -278,13 +278,13 @@ while True:
|
|
278 |
else
|
279 |
printf("%s\n",$0)>>"validDanku.json";
|
280 |
}'
|
281 |
-
if [ ! -
|
282 |
then mkdir -p roberta-classical-chinese-base-char.danku
|
283 |
-
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-base-char --train_file trainDanku.json --validation_file validDanku.json --output_dir roberta-classical-chinese-base-char.danku --do_train --do_eval
|
284 |
fi
|
285 |
-
if [ ! -
|
286 |
then mkdir -p roberta-classical-chinese-large-char.danku
|
287 |
-
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-large-char --train_file trainDanku.json --validation_file validDanku.json --output_dir roberta-classical-chinese-large-char.danku --do_train --do_eval
|
288 |
fi
|
289 |
|
290 |
nawk '
|
@@ -294,13 +294,13 @@ nawk '
|
|
294 |
else
|
295 |
printf("%s\n",$0)>"validPOS.json";
|
296 |
}' traditionalPOS.json
|
297 |
-
if [ ! -
|
298 |
then mkdir -p sikubert.pos
|
299 |
-
python3 run_ner.py --model_name_or_path SIKU-BERT/sikubert --train_file trainPOS.json --validation_file validPOS.json --output_dir sikubert.pos --do_train --do_eval
|
300 |
fi
|
301 |
-
if [ ! -
|
302 |
then mkdir -p sikuroberta.pos
|
303 |
-
python3 run_ner.py --model_name_or_path SIKU-BERT/sikuroberta --train_file trainPOS.json --validation_file validPOS.json --output_dir sikuroberta.pos --do_train --do_eval
|
304 |
fi
|
305 |
|
306 |
nawk '
|
@@ -329,13 +329,13 @@ nawk '
|
|
329 |
else
|
330 |
printf("%s\n",$0)>"validDanku.json";
|
331 |
}' traditionalDanku.json
|
332 |
-
if [ ! -
|
333 |
then mkdir -p sikubert.danku
|
334 |
-
python3 run_ner.py --model_name_or_path SIKU-BERT/sikubert --train_file trainDanku.json --validation_file validDanku.json --output_dir sikubert.danku --do_train --do_eval
|
335 |
fi
|
336 |
-
if [ ! -
|
337 |
then mkdir -p sikuroberta.danku
|
338 |
-
python3 run_ner.py --model_name_or_path SIKU-BERT/sikuroberta --train_file trainDanku.json --validation_file validDanku.json --output_dir sikuroberta.danku --do_train --do_eval
|
339 |
fi
|
340 |
|
341 |
exit 0
|
|
|
1 |
#! /bin/sh
|
2 |
+
# pip3 install 'transformers>=4.10.0' seqeval datasets supar==1.1.3
|
3 |
+
test -f run_ner.py || curl -LO https://raw.githubusercontent.com/huggingface/transformers/v`pip3 list | sed -n 's/^transformers *\([^ ]*\) *$/\1/p'`/examples/pytorch/token-classification/run_ner.py
|
4 |
|
5 |
python3 -c '
|
6 |
from suparkanbun.simplify import simplify
|
|
|
73 |
printf("%s\n",$0)>"validPOS.json";
|
74 |
}'
|
75 |
sed 's/^.*"tags":\[//' trainPOS.json | tr '"' '\012' | sort -u | egrep '^[nvps],' > labelPOS.txt
|
76 |
+
if [ ! -f guwenbert-base.pos/pytorch_model.bin ]
|
77 |
then mkdir -p guwenbert-base.pos
|
78 |
+
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-base --train_file trainPOS.json --validation_file validPOS.json --output_dir guwenbert-base.pos --do_train --do_eval --overwrite_output_dir
|
79 |
fi
|
80 |
+
if [ ! -f guwenbert-large.pos/pytorch_model.bin ]
|
81 |
then mkdir -p guwenbert-large.pos
|
82 |
+
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-large --train_file trainPOS.json --validation_file validPOS.json --output_dir guwenbert-large.pos --do_train --do_eval --overwrite_output_dir --per_device_train_batch_size=4 --per_device_eval_batch_size=4
|
83 |
fi
|
84 |
|
85 |
nawk '
|
|
|
139 |
printf("%s\n",$0)>"validDanku.json";
|
140 |
}'
|
141 |
sed 's/^.*"tags":\[//' trainDanku.json | tr '"' '\012' | sort -u | egrep '^[A-Z]' > labelDanku.txt
|
142 |
+
if [ ! -f guwenbert-base.danku/pytorch_model.bin ]
|
143 |
then mkdir -p guwenbert-base.danku
|
144 |
+
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-base --train_file trainDanku.json --validation_file validDanku.json --output_dir guwenbert-base.danku --do_train --do_eval --overwrite_output_dir
|
145 |
fi
|
146 |
+
if [ ! -f guwenbert-large.danku/pytorch_model.bin ]
|
147 |
then mkdir -p guwenbert-large.danku
|
148 |
+
python3 run_ner.py --model_name_or_path ethanyt/guwenbert-large --train_file trainDanku.json --validation_file validDanku.json --output_dir guwenbert-large.danku --do_train --do_eval --overwrite_output_dir --per_device_train_batch_size=4 --per_device_eval_batch_size=4
|
149 |
fi
|
150 |
|
151 |
python3 -c '
|
|
|
213 |
else
|
214 |
printf("%s\n",$0)>>"validPOS.json";
|
215 |
}'
|
216 |
+
if [ ! -f roberta-classical-chinese-base-char.pos/pytorch_model.bin ]
|
217 |
then mkdir -p roberta-classical-chinese-base-char.pos
|
218 |
+
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-base-char --train_file trainPOS.json --validation_file validPOS.json --output_dir roberta-classical-chinese-base-char.pos --do_train --do_eval --overwrite_output_dir
|
219 |
fi
|
220 |
+
if [ ! -f roberta-classical-chinese-large-char.pos/pytorch_model.bin ]
|
221 |
then mkdir -p roberta-classical-chinese-large-char.pos
|
222 |
+
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-large-char --train_file trainPOS.json --validation_file validPOS.json --output_dir roberta-classical-chinese-large-char.pos --do_train --do_eval --overwrite_output_dir --per_device_train_batch_size=4 --per_device_eval_batch_size=4
|
223 |
fi
|
224 |
|
225 |
nawk '
|
|
|
278 |
else
|
279 |
printf("%s\n",$0)>>"validDanku.json";
|
280 |
}'
|
281 |
+
if [ ! -f roberta-classical-chinese-base-char.danku/pytorch_model.bin ]
|
282 |
then mkdir -p roberta-classical-chinese-base-char.danku
|
283 |
+
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-base-char --train_file trainDanku.json --validation_file validDanku.json --output_dir roberta-classical-chinese-base-char.danku --do_train --do_eval --overwrite_output_dir
|
284 |
fi
|
285 |
+
if [ ! -f roberta-classical-chinese-large-char.danku/pytorch_model.bin ]
|
286 |
then mkdir -p roberta-classical-chinese-large-char.danku
|
287 |
+
python3 run_ner.py --model_name_or_path KoichiYasuoka/roberta-classical-chinese-large-char --train_file trainDanku.json --validation_file validDanku.json --output_dir roberta-classical-chinese-large-char.danku --do_train --do_eval --overwrite_output_dir --per_device_train_batch_size=4 --per_device_eval_batch_size=4
|
288 |
fi
|
289 |
|
290 |
nawk '
|
|
|
294 |
else
|
295 |
printf("%s\n",$0)>"validPOS.json";
|
296 |
}' traditionalPOS.json
|
297 |
+
if [ ! -f sikubert.pos/pytorch_model.bin ]
|
298 |
then mkdir -p sikubert.pos
|
299 |
+
python3 run_ner.py --model_name_or_path SIKU-BERT/sikubert --train_file trainPOS.json --validation_file validPOS.json --output_dir sikubert.pos --do_train --do_eval --overwrite_output_dir
|
300 |
fi
|
301 |
+
if [ ! -f sikuroberta.pos/pytorch_model.bin ]
|
302 |
then mkdir -p sikuroberta.pos
|
303 |
+
python3 run_ner.py --model_name_or_path SIKU-BERT/sikuroberta --train_file trainPOS.json --validation_file validPOS.json --output_dir sikuroberta.pos --do_train --do_eval --overwrite_output_dir
|
304 |
fi
|
305 |
|
306 |
nawk '
|
|
|
329 |
else
|
330 |
printf("%s\n",$0)>"validDanku.json";
|
331 |
}' traditionalDanku.json
|
332 |
+
if [ ! -f sikubert.danku/pytorch_model.bin ]
|
333 |
then mkdir -p sikubert.danku
|
334 |
+
python3 run_ner.py --model_name_or_path SIKU-BERT/sikubert --train_file trainDanku.json --validation_file validDanku.json --output_dir sikubert.danku --do_train --do_eval --overwrite_output_dir
|
335 |
fi
|
336 |
+
if [ ! -f sikuroberta.danku/pytorch_model.bin ]
|
337 |
then mkdir -p sikuroberta.danku
|
338 |
+
python3 run_ner.py --model_name_or_path SIKU-BERT/sikuroberta --train_file trainDanku.json --validation_file validDanku.json --output_dir sikuroberta.danku --do_train --do_eval --overwrite_output_dir
|
339 |
fi
|
340 |
|
341 |
exit 0
|
suparkanbun/models/roberta-classical-chinese-base-char.danku/config.json
CHANGED
@@ -5,6 +5,7 @@
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
@@ -12,22 +13,22 @@
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
-
"0": "
|
16 |
-
"1": "
|
17 |
-
"2": "
|
18 |
-
"3": "
|
19 |
-
"4": "
|
20 |
-
"5": "
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 3072,
|
24 |
"label2id": {
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
-
"
|
31 |
},
|
32 |
"layer_norm_eps": 1e-05,
|
33 |
"max_position_embeddings": 514,
|
@@ -38,7 +39,7 @@
|
|
38 |
"position_embedding_type": "absolute",
|
39 |
"tokenizer_class": "BertTokenizer",
|
40 |
"torch_dtype": "float32",
|
41 |
-
"transformers_version": "4.
|
42 |
"type_vocab_size": 1,
|
43 |
"use_cache": true,
|
44 |
"vocab_size": 26318
|
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
"eos_token_id": 2,
|
10 |
"finetuning_task": "ner",
|
11 |
"gradient_checkpointing": false,
|
|
|
13 |
"hidden_dropout_prob": 0.1,
|
14 |
"hidden_size": 768,
|
15 |
"id2label": {
|
16 |
+
"0": "B",
|
17 |
+
"1": "E",
|
18 |
+
"2": "E2",
|
19 |
+
"3": "E3",
|
20 |
+
"4": "M",
|
21 |
+
"5": "S"
|
22 |
},
|
23 |
"initializer_range": 0.02,
|
24 |
"intermediate_size": 3072,
|
25 |
"label2id": {
|
26 |
+
"B": 0,
|
27 |
+
"E": 1,
|
28 |
+
"E2": 2,
|
29 |
+
"E3": 3,
|
30 |
+
"M": 4,
|
31 |
+
"S": 5
|
32 |
},
|
33 |
"layer_norm_eps": 1e-05,
|
34 |
"max_position_embeddings": 514,
|
|
|
39 |
"position_embedding_type": "absolute",
|
40 |
"tokenizer_class": "BertTokenizer",
|
41 |
"torch_dtype": "float32",
|
42 |
+
"transformers_version": "4.11.3",
|
43 |
"type_vocab_size": 1,
|
44 |
"use_cache": true,
|
45 |
"vocab_size": 26318
|
suparkanbun/models/roberta-classical-chinese-base-char.danku/filesize.txt
CHANGED
@@ -1 +1 @@
|
|
1 |
-
pytorch_model.bin
|
|
|
1 |
+
pytorch_model.bin 422761232
|
suparkanbun/models/roberta-classical-chinese-base-char.danku/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4f75f8201c4ddae696bef91c824de7a851cdc7fbf3243832fa65425e3556c99
|
3 |
+
size 422761232
|
suparkanbun/models/roberta-classical-chinese-base-char.danku/tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "model_max_length": 512, "do_basic_tokenize": true, "never_split": null, "add_prefix_space": true, "name_or_path": "KoichiYasuoka/roberta-classical-chinese-base-char", "tokenizer_class": "BertTokenizer"}
|
suparkanbun/models/roberta-classical-chinese-large-char.danku/config.json
CHANGED
@@ -5,6 +5,7 @@
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
@@ -12,22 +13,22 @@
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 1024,
|
14 |
"id2label": {
|
15 |
-
"0": "
|
16 |
-
"1": "
|
17 |
-
"2": "
|
18 |
-
"3": "
|
19 |
-
"4": "
|
20 |
-
"5": "
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 4096,
|
24 |
"label2id": {
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
-
"
|
31 |
},
|
32 |
"layer_norm_eps": 1e-05,
|
33 |
"max_position_embeddings": 514,
|
@@ -38,7 +39,7 @@
|
|
38 |
"position_embedding_type": "absolute",
|
39 |
"tokenizer_class": "BertTokenizer",
|
40 |
"torch_dtype": "float32",
|
41 |
-
"transformers_version": "4.
|
42 |
"type_vocab_size": 1,
|
43 |
"use_cache": true,
|
44 |
"vocab_size": 26318
|
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
"eos_token_id": 2,
|
10 |
"finetuning_task": "ner",
|
11 |
"gradient_checkpointing": false,
|
|
|
13 |
"hidden_dropout_prob": 0.1,
|
14 |
"hidden_size": 1024,
|
15 |
"id2label": {
|
16 |
+
"0": "B",
|
17 |
+
"1": "E",
|
18 |
+
"2": "E2",
|
19 |
+
"3": "E3",
|
20 |
+
"4": "M",
|
21 |
+
"5": "S"
|
22 |
},
|
23 |
"initializer_range": 0.02,
|
24 |
"intermediate_size": 4096,
|
25 |
"label2id": {
|
26 |
+
"B": 0,
|
27 |
+
"E": 1,
|
28 |
+
"E2": 2,
|
29 |
+
"E3": 3,
|
30 |
+
"M": 4,
|
31 |
+
"S": 5
|
32 |
},
|
33 |
"layer_norm_eps": 1e-05,
|
34 |
"max_position_embeddings": 514,
|
|
|
39 |
"position_embedding_type": "absolute",
|
40 |
"tokenizer_class": "BertTokenizer",
|
41 |
"torch_dtype": "float32",
|
42 |
+
"transformers_version": "4.11.3",
|
43 |
"type_vocab_size": 1,
|
44 |
"use_cache": true,
|
45 |
"vocab_size": 26318
|
suparkanbun/models/roberta-classical-chinese-large-char.danku/filesize.txt
CHANGED
@@ -1 +1 @@
|
|
1 |
-
pytorch_model.bin
|
|
|
1 |
+
pytorch_model.bin 1319347026
|
suparkanbun/models/roberta-classical-chinese-large-char.danku/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b58082715c5ad717f2404990fbe7a38aa220753e9ad52877b4c378a09ff5345b
|
3 |
+
size 1319347026
|
suparkanbun/models/roberta-classical-chinese-large-char.danku/tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "do_basic_tokenize": true, "never_split": null, "name_or_path": "KoichiYasuoka/roberta-classical-chinese-large-char", "tokenizer_class": "BertTokenizer"}
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "model_max_length": 512, "do_basic_tokenize": true, "never_split": null, "add_prefix_space": true, "name_or_path": "KoichiYasuoka/roberta-classical-chinese-large-char", "tokenizer_class": "BertTokenizer"}
|
suparkanbun/models/roberta-classical-chinese-large-char.pos/config.json
CHANGED
@@ -5,6 +5,7 @@
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
@@ -12,268 +13,268 @@
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 1024,
|
14 |
"id2label": {
|
15 |
-
"0": "n
|
16 |
-
"1": "n
|
17 |
-
"2": "n
|
18 |
-
"3": "n
|
19 |
-
"4": "n
|
20 |
-
"5": "n
|
21 |
-
"6": "n
|
22 |
-
"7": "n
|
23 |
-
"8": "n
|
24 |
-
"9": "n
|
25 |
-
"10": "n
|
26 |
-
"11": "n
|
27 |
-
"12": "n
|
28 |
-
"13": "n
|
29 |
-
"14": "n
|
30 |
-
"15": "n
|
31 |
-
"16": "n
|
32 |
-
"17": "n
|
33 |
-
"18": "n
|
34 |
-
"19": "n
|
35 |
-
"20": "n
|
36 |
-
"21": "n
|
37 |
-
"22": "n
|
38 |
-
"23": "n
|
39 |
-
"24": "n
|
40 |
-
"25": "n
|
41 |
-
"26": "n
|
42 |
-
"27": "n
|
43 |
-
"28": "n
|
44 |
-
"29": "n
|
45 |
-
"30": "n
|
46 |
-
"31": "n
|
47 |
-
"32": "n
|
48 |
-
"33": "n
|
49 |
-
"34": "n
|
50 |
-
"35": "n
|
51 |
-
"36": "n
|
52 |
-
"37": "n
|
53 |
-
"38": "n
|
54 |
-
"39": "n
|
55 |
-
"40": "n
|
56 |
-
"41": "n
|
57 |
-
"42": "n
|
58 |
-
"43": "n
|
59 |
-
"44": "n
|
60 |
-
"45": "n
|
61 |
-
"46": "n
|
62 |
-
"47": "n
|
63 |
-
"48": "n
|
64 |
-
"49": "n
|
65 |
-
"50": "n
|
66 |
-
"51": "n
|
67 |
-
"52": "n
|
68 |
-
"53": "n
|
69 |
-
"54": "n
|
70 |
-
"55": "n
|
71 |
-
"56": "p
|
72 |
-
"57": "p
|
73 |
-
"58": "p
|
74 |
-
"59": "p
|
75 |
-
"60": "p
|
76 |
-
"61": "p
|
77 |
-
"62": "p
|
78 |
-
"63": "p
|
79 |
-
"64": "s
|
80 |
-
"65": "s
|
81 |
-
"66": "s
|
82 |
-
"67": "s
|
83 |
-
"68": "v
|
84 |
-
"69": "v
|
85 |
-
"70": "v
|
86 |
-
"71": "v
|
87 |
-
"72": "v
|
88 |
-
"73": "v
|
89 |
-
"74": "v
|
90 |
-
"75": "v
|
91 |
-
"76": "v
|
92 |
-
"77": "v
|
93 |
-
"78": "v
|
94 |
-
"79": "v
|
95 |
-
"80": "v
|
96 |
-
"81": "v
|
97 |
-
"82": "v
|
98 |
-
"83": "v
|
99 |
-
"84": "v
|
100 |
-
"85": "v
|
101 |
-
"86": "v
|
102 |
-
"87": "v
|
103 |
-
"88": "v
|
104 |
-
"89": "v
|
105 |
-
"90": "v
|
106 |
-
"91": "v
|
107 |
-
"92": "v
|
108 |
-
"93": "v
|
109 |
-
"94": "v
|
110 |
-
"95": "v
|
111 |
-
"96": "v
|
112 |
-
"97": "v
|
113 |
-
"98": "v
|
114 |
-
"99": "v
|
115 |
-
"100": "v
|
116 |
-
"101": "v
|
117 |
-
"102": "v
|
118 |
-
"103": "v
|
119 |
-
"104": "v
|
120 |
-
"105": "v
|
121 |
-
"106": "v
|
122 |
-
"107": "v
|
123 |
-
"108": "v
|
124 |
-
"109": "v
|
125 |
-
"110": "v
|
126 |
-
"111": "v
|
127 |
-
"112": "v
|
128 |
-
"113": "v
|
129 |
-
"114": "v
|
130 |
-
"115": "v
|
131 |
-
"116": "v
|
132 |
-
"117": "v
|
133 |
-
"118": "v
|
134 |
-
"119": "v
|
135 |
-
"120": "v
|
136 |
-
"121": "v
|
137 |
-
"122": "v
|
138 |
-
"123": "v
|
139 |
-
"124": "v
|
140 |
-
"125": "v
|
141 |
-
"126": "v
|
142 |
-
"127": "v
|
143 |
-
"128": "v
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 4096,
|
147 |
"label2id": {
|
148 |
-
"n
|
149 |
-
"n
|
150 |
-
"n
|
151 |
-
"n
|
152 |
-
"n
|
153 |
-
"n
|
154 |
-
"n
|
155 |
-
"n
|
156 |
-
"n
|
157 |
-
"n
|
158 |
-
"n
|
159 |
-
"n
|
160 |
-
"n
|
161 |
-
"n
|
162 |
-
"n
|
163 |
-
"n
|
164 |
-
"n
|
165 |
-
"n
|
166 |
-
"n
|
167 |
-
"n
|
168 |
-
"n
|
169 |
-
"n
|
170 |
-
"n
|
171 |
-
"n
|
172 |
-
"n
|
173 |
-
"n
|
174 |
-
"n
|
175 |
-
"n
|
176 |
-
"n
|
177 |
-
"n
|
178 |
-
"n
|
179 |
-
"n
|
180 |
-
"n
|
181 |
-
"n
|
182 |
-
"n
|
183 |
-
"n
|
184 |
-
"n
|
185 |
-
"n
|
186 |
-
"n
|
187 |
-
"n
|
188 |
-
"n
|
189 |
-
"n
|
190 |
-
"n
|
191 |
-
"n
|
192 |
-
"n
|
193 |
-
"n
|
194 |
-
"n
|
195 |
-
"n
|
196 |
-
"n
|
197 |
-
"n
|
198 |
-
"n
|
199 |
-
"n
|
200 |
-
"n
|
201 |
-
"n
|
202 |
-
"n
|
203 |
-
"n
|
204 |
-
"p
|
205 |
-
"p
|
206 |
-
"p
|
207 |
-
"p
|
208 |
-
"p
|
209 |
-
"p
|
210 |
-
"p
|
211 |
-
"p
|
212 |
-
"s
|
213 |
-
"s
|
214 |
-
"s
|
215 |
-
"s
|
216 |
-
"v
|
217 |
-
"v
|
218 |
-
"v
|
219 |
-
"v
|
220 |
-
"v
|
221 |
-
"v
|
222 |
-
"v
|
223 |
-
"v
|
224 |
-
"v
|
225 |
-
"v
|
226 |
-
"v
|
227 |
-
"v
|
228 |
-
"v
|
229 |
-
"v
|
230 |
-
"v
|
231 |
-
"v
|
232 |
-
"v
|
233 |
-
"v
|
234 |
-
"v
|
235 |
-
"v
|
236 |
-
"v
|
237 |
-
"v
|
238 |
-
"v
|
239 |
-
"v
|
240 |
-
"v
|
241 |
-
"v
|
242 |
-
"v
|
243 |
-
"v
|
244 |
-
"v
|
245 |
-
"v
|
246 |
-
"v
|
247 |
-
"v
|
248 |
-
"v
|
249 |
-
"v
|
250 |
-
"v
|
251 |
-
"v
|
252 |
-
"v
|
253 |
-
"v
|
254 |
-
"v
|
255 |
-
"v
|
256 |
-
"v
|
257 |
-
"v
|
258 |
-
"v
|
259 |
-
"v
|
260 |
-
"v
|
261 |
-
"v
|
262 |
-
"v
|
263 |
-
"v
|
264 |
-
"v
|
265 |
-
"v
|
266 |
-
"v
|
267 |
-
"v
|
268 |
-
"v
|
269 |
-
"v
|
270 |
-
"v
|
271 |
-
"v
|
272 |
-
"v
|
273 |
-
"v
|
274 |
-
"v
|
275 |
-
"v
|
276 |
-
"v
|
277 |
},
|
278 |
"layer_norm_eps": 1e-05,
|
279 |
"max_position_embeddings": 514,
|
@@ -284,7 +285,7 @@
|
|
284 |
"position_embedding_type": "absolute",
|
285 |
"tokenizer_class": "BertTokenizer",
|
286 |
"torch_dtype": "float32",
|
287 |
-
"transformers_version": "4.
|
288 |
"type_vocab_size": 1,
|
289 |
"use_cache": true,
|
290 |
"vocab_size": 26318
|
|
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
"eos_token_id": 2,
|
10 |
"finetuning_task": "ner",
|
11 |
"gradient_checkpointing": false,
|
|
|
13 |
"hidden_dropout_prob": 0.1,
|
14 |
"hidden_size": 1024,
|
15 |
"id2label": {
|
16 |
+
"0": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs",
|
17 |
+
"1": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs",
|
18 |
+
"2": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs",
|
19 |
+
"3": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs",
|
20 |
+
"4": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes",
|
21 |
+
"5": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs",
|
22 |
+
"6": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs",
|
23 |
+
"7": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs",
|
24 |
+
"8": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs",
|
25 |
+
"9": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs",
|
26 |
+
"10": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs",
|
27 |
+
"11": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs",
|
28 |
+
"12": "n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem",
|
29 |
+
"13": "n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int",
|
30 |
+
"14": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_",
|
31 |
+
"15": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_",
|
32 |
+
"16": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_",
|
33 |
+
"17": "n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_",
|
34 |
+
"18": "n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat",
|
35 |
+
"19": "n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_",
|
36 |
+
"20": "n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_",
|
37 |
+
"21": "n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_",
|
38 |
+
"22": "n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_",
|
39 |
+
"23": "n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs",
|
40 |
+
"24": "n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_",
|
41 |
+
"25": "n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv",
|
42 |
+
"26": "n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur",
|
43 |
+
"27": "n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_",
|
44 |
+
"28": "n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs",
|
45 |
+
"29": "n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_",
|
46 |
+
"30": "n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_",
|
47 |
+
"31": "n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc",
|
48 |
+
"32": "n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_",
|
49 |
+
"33": "n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_",
|
50 |
+
"34": "n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_",
|
51 |
+
"35": "n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_",
|
52 |
+
"36": "n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_",
|
53 |
+
"37": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo",
|
54 |
+
"38": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc",
|
55 |
+
"39": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc",
|
56 |
+
"40": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_",
|
57 |
+
"41": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc",
|
58 |
+
"42": "n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_",
|
59 |
+
"43": "n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_",
|
60 |
+
"44": "n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_",
|
61 |
+
"45": "n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_",
|
62 |
+
"46": "n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf",
|
63 |
+
"47": "n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_",
|
64 |
+
"48": "n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_",
|
65 |
+
"49": "n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_",
|
66 |
+
"50": "n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_",
|
67 |
+
"51": "n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem",
|
68 |
+
"52": "n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_",
|
69 |
+
"53": "n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord",
|
70 |
+
"54": "n,\u6570\u8a5e,\u6570,*,NUM,_",
|
71 |
+
"55": "n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_",
|
72 |
+
"56": "p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_",
|
73 |
+
"57": "p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_",
|
74 |
+
"58": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_",
|
75 |
+
"59": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_",
|
76 |
+
"60": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_",
|
77 |
+
"61": "p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_",
|
78 |
+
"62": "p,\u611f\u5606\u8a5e,*,*,INTJ,_",
|
79 |
+
"63": "p,\u63a5\u5c3e\u8f9e,*,*,PART,_",
|
80 |
+
"64": "s,\u6587\u5b57,*,*,SYM,_",
|
81 |
+
"65": "s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_",
|
82 |
+
"66": "s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_",
|
83 |
+
"67": "s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_",
|
84 |
+
"68": "v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_",
|
85 |
+
"69": "v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_",
|
86 |
+
"70": "v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_",
|
87 |
+
"71": "v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_",
|
88 |
+
"72": "v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_",
|
89 |
+
"73": "v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_",
|
90 |
+
"74": "v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_",
|
91 |
+
"75": "v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg",
|
92 |
+
"76": "v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg",
|
93 |
+
"77": "v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg",
|
94 |
+
"78": "v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg",
|
95 |
+
"79": "v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_",
|
96 |
+
"80": "v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim",
|
97 |
+
"81": "v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf",
|
98 |
+
"82": "v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut",
|
99 |
+
"83": "v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim",
|
100 |
+
"84": "v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres",
|
101 |
+
"85": "v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim",
|
102 |
+
"86": "v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim",
|
103 |
+
"87": "v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim",
|
104 |
+
"88": "v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past",
|
105 |
+
"89": "v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau",
|
106 |
+
"90": "v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_",
|
107 |
+
"91": "v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_",
|
108 |
+
"92": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp",
|
109 |
+
"93": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup",
|
110 |
+
"94": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos",
|
111 |
+
"95": "v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_",
|
112 |
+
"96": "v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_",
|
113 |
+
"97": "v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_",
|
114 |
+
"98": "v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_",
|
115 |
+
"99": "v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_",
|
116 |
+
"100": "v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_",
|
117 |
+
"101": "v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass",
|
118 |
+
"102": "v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot",
|
119 |
+
"103": "v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec",
|
120 |
+
"104": "v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des",
|
121 |
+
"105": "v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_",
|
122 |
+
"106": "v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_",
|
123 |
+
"107": "v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_",
|
124 |
+
"108": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg",
|
125 |
+
"109": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop",
|
126 |
+
"110": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_",
|
127 |
+
"111": "v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos",
|
128 |
+
"112": "v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos",
|
129 |
+
"113": "v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos",
|
130 |
+
"114": "v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos",
|
131 |
+
"115": "v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_",
|
132 |
+
"116": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_",
|
133 |
+
"117": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_",
|
134 |
+
"118": "v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_",
|
135 |
+
"119": "v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ",
|
136 |
+
"120": "v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_",
|
137 |
+
"121": "v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_",
|
138 |
+
"122": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_",
|
139 |
+
"123": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_",
|
140 |
+
"124": "v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_",
|
141 |
+
"125": "v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_",
|
142 |
+
"126": "v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_",
|
143 |
+
"127": "v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_",
|
144 |
+
"128": "v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_"
|
145 |
},
|
146 |
"initializer_range": 0.02,
|
147 |
"intermediate_size": 4096,
|
148 |
"label2id": {
|
149 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs": 0,
|
150 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs": 1,
|
151 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs": 2,
|
152 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs": 3,
|
153 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes": 4,
|
154 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs": 5,
|
155 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs": 6,
|
156 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs": 7,
|
157 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs": 8,
|
158 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs": 9,
|
159 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs": 10,
|
160 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs": 11,
|
161 |
+
"n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem": 12,
|
162 |
+
"n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int": 13,
|
163 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_": 14,
|
164 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_": 15,
|
165 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_": 16,
|
166 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_": 17,
|
167 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat": 18,
|
168 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_": 19,
|
169 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_": 20,
|
170 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_": 21,
|
171 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_": 22,
|
172 |
+
"n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs": 23,
|
173 |
+
"n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_": 24,
|
174 |
+
"n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv": 25,
|
175 |
+
"n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur": 26,
|
176 |
+
"n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_": 27,
|
177 |
+
"n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs": 28,
|
178 |
+
"n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_": 29,
|
179 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_": 30,
|
180 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc": 31,
|
181 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_": 32,
|
182 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_": 33,
|
183 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_": 34,
|
184 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_": 35,
|
185 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_": 36,
|
186 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo": 37,
|
187 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc": 38,
|
188 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc": 39,
|
189 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_": 40,
|
190 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc": 41,
|
191 |
+
"n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_": 42,
|
192 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_": 43,
|
193 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_": 44,
|
194 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_": 45,
|
195 |
+
"n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf": 46,
|
196 |
+
"n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_": 47,
|
197 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_": 48,
|
198 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_": 49,
|
199 |
+
"n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_": 50,
|
200 |
+
"n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem": 51,
|
201 |
+
"n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_": 52,
|
202 |
+
"n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord": 53,
|
203 |
+
"n,\u6570\u8a5e,\u6570,*,NUM,_": 54,
|
204 |
+
"n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_": 55,
|
205 |
+
"p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_": 56,
|
206 |
+
"p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_": 57,
|
207 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_": 58,
|
208 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_": 59,
|
209 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_": 60,
|
210 |
+
"p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_": 61,
|
211 |
+
"p,\u611f\u5606\u8a5e,*,*,INTJ,_": 62,
|
212 |
+
"p,\u63a5\u5c3e\u8f9e,*,*,PART,_": 63,
|
213 |
+
"s,\u6587\u5b57,*,*,SYM,_": 64,
|
214 |
+
"s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_": 65,
|
215 |
+
"s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_": 66,
|
216 |
+
"s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_": 67,
|
217 |
+
"v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_": 68,
|
218 |
+
"v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_": 69,
|
219 |
+
"v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_": 70,
|
220 |
+
"v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_": 71,
|
221 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_": 72,
|
222 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_": 73,
|
223 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_": 74,
|
224 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg": 75,
|
225 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg": 76,
|
226 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg": 77,
|
227 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg": 78,
|
228 |
+
"v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_": 79,
|
229 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim": 80,
|
230 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf": 81,
|
231 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut": 82,
|
232 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim": 83,
|
233 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres": 84,
|
234 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim": 85,
|
235 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim": 86,
|
236 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim": 87,
|
237 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past": 88,
|
238 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau": 89,
|
239 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_": 90,
|
240 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_": 91,
|
241 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp": 92,
|
242 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup": 93,
|
243 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos": 94,
|
244 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_": 95,
|
245 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_": 96,
|
246 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_": 97,
|
247 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_": 98,
|
248 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_": 99,
|
249 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_": 100,
|
250 |
+
"v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass": 101,
|
251 |
+
"v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot": 102,
|
252 |
+
"v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec": 103,
|
253 |
+
"v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des": 104,
|
254 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_": 105,
|
255 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_": 106,
|
256 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_": 107,
|
257 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg": 108,
|
258 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop": 109,
|
259 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_": 110,
|
260 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos": 111,
|
261 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos": 112,
|
262 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos": 113,
|
263 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos": 114,
|
264 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_": 115,
|
265 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_": 116,
|
266 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_": 117,
|
267 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_": 118,
|
268 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ": 119,
|
269 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_": 120,
|
270 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_": 121,
|
271 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_": 122,
|
272 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_": 123,
|
273 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_": 124,
|
274 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_": 125,
|
275 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_": 126,
|
276 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_": 127,
|
277 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_": 128
|
278 |
},
|
279 |
"layer_norm_eps": 1e-05,
|
280 |
"max_position_embeddings": 514,
|
|
|
285 |
"position_embedding_type": "absolute",
|
286 |
"tokenizer_class": "BertTokenizer",
|
287 |
"torch_dtype": "float32",
|
288 |
+
"transformers_version": "4.11.3",
|
289 |
"type_vocab_size": 1,
|
290 |
"use_cache": true,
|
291 |
"vocab_size": 26318
|
suparkanbun/models/roberta-classical-chinese-large-char.pos/filesize.txt
CHANGED
@@ -1,2 +1,2 @@
|
|
1 |
-
pytorch_model.bin
|
2 |
-
roberta-classical-chinese-large-char.supar
|
|
|
1 |
+
pytorch_model.bin 1319851346
|
2 |
+
roberta-classical-chinese-large-char.supar 1371926646
|
suparkanbun/models/roberta-classical-chinese-large-char.pos/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c282677ea17ec6bb123cf9abe7d9cf2c271ca7ccdacd896b35013fdcd91c204
|
3 |
+
size 1319851346
|
suparkanbun/models/roberta-classical-chinese-large-char.pos/roberta-classical-chinese-large-char.supar
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b021ab26a13e1904800e58855513b121d4b356d2310aa3abd7f2ec7d0141340
|
3 |
+
size 1371926646
|
suparkanbun/models/roberta-classical-chinese-large-char.pos/tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "do_basic_tokenize": true, "never_split": null, "name_or_path": "KoichiYasuoka/roberta-classical-chinese-large-char", "tokenizer_class": "BertTokenizer"}
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "model_max_length": 512, "do_basic_tokenize": true, "never_split": null, "add_prefix_space": true, "name_or_path": "KoichiYasuoka/roberta-classical-chinese-large-char", "tokenizer_class": "BertTokenizer"}
|
suparkanbun/models/sikubert.danku/config.json
CHANGED
@@ -4,6 +4,7 @@
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
|
|
7 |
"directionality": "bidi",
|
8 |
"finetuning_task": "ner",
|
9 |
"gradient_checkpointing": false,
|
@@ -11,22 +12,22 @@
|
|
11 |
"hidden_dropout_prob": 0.1,
|
12 |
"hidden_size": 768,
|
13 |
"id2label": {
|
14 |
-
"0": "
|
15 |
-
"1": "
|
16 |
-
"2": "
|
17 |
-
"3": "
|
18 |
-
"4": "
|
19 |
-
"5": "
|
20 |
},
|
21 |
"initializer_range": 0.02,
|
22 |
"intermediate_size": 3072,
|
23 |
"label2id": {
|
24 |
-
"
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
},
|
31 |
"layer_norm_eps": 1e-12,
|
32 |
"max_position_embeddings": 512,
|
@@ -41,7 +42,7 @@
|
|
41 |
"pooler_type": "first_token_transform",
|
42 |
"position_embedding_type": "absolute",
|
43 |
"torch_dtype": "float32",
|
44 |
-
"transformers_version": "4.
|
45 |
"type_vocab_size": 2,
|
46 |
"use_cache": true,
|
47 |
"vocab_size": 29791
|
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
"directionality": "bidi",
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
+
"0": "B",
|
16 |
+
"1": "E",
|
17 |
+
"2": "E2",
|
18 |
+
"3": "E3",
|
19 |
+
"4": "M",
|
20 |
+
"5": "S"
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 3072,
|
24 |
"label2id": {
|
25 |
+
"B": 0,
|
26 |
+
"E": 1,
|
27 |
+
"E2": 2,
|
28 |
+
"E3": 3,
|
29 |
+
"M": 4,
|
30 |
+
"S": 5
|
31 |
},
|
32 |
"layer_norm_eps": 1e-12,
|
33 |
"max_position_embeddings": 512,
|
|
|
42 |
"pooler_type": "first_token_transform",
|
43 |
"position_embedding_type": "absolute",
|
44 |
"torch_dtype": "float32",
|
45 |
+
"transformers_version": "4.11.3",
|
46 |
"type_vocab_size": 2,
|
47 |
"use_cache": true,
|
48 |
"vocab_size": 29791
|
suparkanbun/models/sikubert.danku/filesize.txt
CHANGED
@@ -1 +1 @@
|
|
1 |
-
pytorch_model.bin
|
|
|
1 |
+
pytorch_model.bin 433426003
|
suparkanbun/models/sikubert.danku/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dbf6a91ccf5b5e208afad86ac64c62178c335e8ca7b1625fc14c82acae113a6
|
3 |
+
size 433426003
|
suparkanbun/models/sikubert.pos/config.json
CHANGED
@@ -4,6 +4,7 @@
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
|
|
7 |
"directionality": "bidi",
|
8 |
"finetuning_task": "ner",
|
9 |
"gradient_checkpointing": false,
|
@@ -11,268 +12,268 @@
|
|
11 |
"hidden_dropout_prob": 0.1,
|
12 |
"hidden_size": 768,
|
13 |
"id2label": {
|
14 |
-
"0": "n
|
15 |
-
"1": "n
|
16 |
-
"2": "n
|
17 |
-
"3": "n
|
18 |
-
"4": "n
|
19 |
-
"5": "n
|
20 |
-
"6": "n
|
21 |
-
"7": "n
|
22 |
-
"8": "n
|
23 |
-
"9": "n
|
24 |
-
"10": "n
|
25 |
-
"11": "n
|
26 |
-
"12": "n
|
27 |
-
"13": "n
|
28 |
-
"14": "n
|
29 |
-
"15": "n
|
30 |
-
"16": "n
|
31 |
-
"17": "n
|
32 |
-
"18": "n
|
33 |
-
"19": "n
|
34 |
-
"20": "n
|
35 |
-
"21": "n
|
36 |
-
"22": "n
|
37 |
-
"23": "n
|
38 |
-
"24": "n
|
39 |
-
"25": "n
|
40 |
-
"26": "n
|
41 |
-
"27": "n
|
42 |
-
"28": "n
|
43 |
-
"29": "n
|
44 |
-
"30": "n
|
45 |
-
"31": "n
|
46 |
-
"32": "n
|
47 |
-
"33": "n
|
48 |
-
"34": "n
|
49 |
-
"35": "n
|
50 |
-
"36": "n
|
51 |
-
"37": "n
|
52 |
-
"38": "n
|
53 |
-
"39": "n
|
54 |
-
"40": "n
|
55 |
-
"41": "n
|
56 |
-
"42": "n
|
57 |
-
"43": "n
|
58 |
-
"44": "n
|
59 |
-
"45": "n
|
60 |
-
"46": "n
|
61 |
-
"47": "n
|
62 |
-
"48": "n
|
63 |
-
"49": "n
|
64 |
-
"50": "n
|
65 |
-
"51": "n
|
66 |
-
"52": "n
|
67 |
-
"53": "n
|
68 |
-
"54": "n
|
69 |
-
"55": "n
|
70 |
-
"56": "p
|
71 |
-
"57": "p
|
72 |
-
"58": "p
|
73 |
-
"59": "p
|
74 |
-
"60": "p
|
75 |
-
"61": "p
|
76 |
-
"62": "p
|
77 |
-
"63": "p
|
78 |
-
"64": "s
|
79 |
-
"65": "s
|
80 |
-
"66": "s
|
81 |
-
"67": "s
|
82 |
-
"68": "v
|
83 |
-
"69": "v
|
84 |
-
"70": "v
|
85 |
-
"71": "v
|
86 |
-
"72": "v
|
87 |
-
"73": "v
|
88 |
-
"74": "v
|
89 |
-
"75": "v
|
90 |
-
"76": "v
|
91 |
-
"77": "v
|
92 |
-
"78": "v
|
93 |
-
"79": "v
|
94 |
-
"80": "v
|
95 |
-
"81": "v
|
96 |
-
"82": "v
|
97 |
-
"83": "v
|
98 |
-
"84": "v
|
99 |
-
"85": "v
|
100 |
-
"86": "v
|
101 |
-
"87": "v
|
102 |
-
"88": "v
|
103 |
-
"89": "v
|
104 |
-
"90": "v
|
105 |
-
"91": "v
|
106 |
-
"92": "v
|
107 |
-
"93": "v
|
108 |
-
"94": "v
|
109 |
-
"95": "v
|
110 |
-
"96": "v
|
111 |
-
"97": "v
|
112 |
-
"98": "v
|
113 |
-
"99": "v
|
114 |
-
"100": "v
|
115 |
-
"101": "v
|
116 |
-
"102": "v
|
117 |
-
"103": "v
|
118 |
-
"104": "v
|
119 |
-
"105": "v
|
120 |
-
"106": "v
|
121 |
-
"107": "v
|
122 |
-
"108": "v
|
123 |
-
"109": "v
|
124 |
-
"110": "v
|
125 |
-
"111": "v
|
126 |
-
"112": "v
|
127 |
-
"113": "v
|
128 |
-
"114": "v
|
129 |
-
"115": "v
|
130 |
-
"116": "v
|
131 |
-
"117": "v
|
132 |
-
"118": "v
|
133 |
-
"119": "v
|
134 |
-
"120": "v
|
135 |
-
"121": "v
|
136 |
-
"122": "v
|
137 |
-
"123": "v
|
138 |
-
"124": "v
|
139 |
-
"125": "v
|
140 |
-
"126": "v
|
141 |
-
"127": "v
|
142 |
-
"128": "v
|
143 |
},
|
144 |
"initializer_range": 0.02,
|
145 |
"intermediate_size": 3072,
|
146 |
"label2id": {
|
147 |
-
"n
|
148 |
-
"n
|
149 |
-
"n
|
150 |
-
"n
|
151 |
-
"n
|
152 |
-
"n
|
153 |
-
"n
|
154 |
-
"n
|
155 |
-
"n
|
156 |
-
"n
|
157 |
-
"n
|
158 |
-
"n
|
159 |
-
"n
|
160 |
-
"n
|
161 |
-
"n
|
162 |
-
"n
|
163 |
-
"n
|
164 |
-
"n
|
165 |
-
"n
|
166 |
-
"n
|
167 |
-
"n
|
168 |
-
"n
|
169 |
-
"n
|
170 |
-
"n
|
171 |
-
"n
|
172 |
-
"n
|
173 |
-
"n
|
174 |
-
"n
|
175 |
-
"n
|
176 |
-
"n
|
177 |
-
"n
|
178 |
-
"n
|
179 |
-
"n
|
180 |
-
"n
|
181 |
-
"n
|
182 |
-
"n
|
183 |
-
"n
|
184 |
-
"n
|
185 |
-
"n
|
186 |
-
"n
|
187 |
-
"n
|
188 |
-
"n
|
189 |
-
"n
|
190 |
-
"n
|
191 |
-
"n
|
192 |
-
"n
|
193 |
-
"n
|
194 |
-
"n
|
195 |
-
"n
|
196 |
-
"n
|
197 |
-
"n
|
198 |
-
"n
|
199 |
-
"n
|
200 |
-
"n
|
201 |
-
"n
|
202 |
-
"n
|
203 |
-
"p
|
204 |
-
"p
|
205 |
-
"p
|
206 |
-
"p
|
207 |
-
"p
|
208 |
-
"p
|
209 |
-
"p
|
210 |
-
"p
|
211 |
-
"s
|
212 |
-
"s
|
213 |
-
"s
|
214 |
-
"s
|
215 |
-
"v
|
216 |
-
"v
|
217 |
-
"v
|
218 |
-
"v
|
219 |
-
"v
|
220 |
-
"v
|
221 |
-
"v
|
222 |
-
"v
|
223 |
-
"v
|
224 |
-
"v
|
225 |
-
"v
|
226 |
-
"v
|
227 |
-
"v
|
228 |
-
"v
|
229 |
-
"v
|
230 |
-
"v
|
231 |
-
"v
|
232 |
-
"v
|
233 |
-
"v
|
234 |
-
"v
|
235 |
-
"v
|
236 |
-
"v
|
237 |
-
"v
|
238 |
-
"v
|
239 |
-
"v
|
240 |
-
"v
|
241 |
-
"v
|
242 |
-
"v
|
243 |
-
"v
|
244 |
-
"v
|
245 |
-
"v
|
246 |
-
"v
|
247 |
-
"v
|
248 |
-
"v
|
249 |
-
"v
|
250 |
-
"v
|
251 |
-
"v
|
252 |
-
"v
|
253 |
-
"v
|
254 |
-
"v
|
255 |
-
"v
|
256 |
-
"v
|
257 |
-
"v
|
258 |
-
"v
|
259 |
-
"v
|
260 |
-
"v
|
261 |
-
"v
|
262 |
-
"v
|
263 |
-
"v
|
264 |
-
"v
|
265 |
-
"v
|
266 |
-
"v
|
267 |
-
"v
|
268 |
-
"v
|
269 |
-
"v
|
270 |
-
"v
|
271 |
-
"v
|
272 |
-
"v
|
273 |
-
"v
|
274 |
-
"v
|
275 |
-
"v
|
276 |
},
|
277 |
"layer_norm_eps": 1e-12,
|
278 |
"max_position_embeddings": 512,
|
@@ -287,7 +288,7 @@
|
|
287 |
"pooler_type": "first_token_transform",
|
288 |
"position_embedding_type": "absolute",
|
289 |
"torch_dtype": "float32",
|
290 |
-
"transformers_version": "4.
|
291 |
"type_vocab_size": 2,
|
292 |
"use_cache": true,
|
293 |
"vocab_size": 29791
|
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
"directionality": "bidi",
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
+
"0": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs",
|
16 |
+
"1": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs",
|
17 |
+
"2": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs",
|
18 |
+
"3": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs",
|
19 |
+
"4": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes",
|
20 |
+
"5": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs",
|
21 |
+
"6": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs",
|
22 |
+
"7": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs",
|
23 |
+
"8": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs",
|
24 |
+
"9": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs",
|
25 |
+
"10": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs",
|
26 |
+
"11": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs",
|
27 |
+
"12": "n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem",
|
28 |
+
"13": "n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int",
|
29 |
+
"14": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_",
|
30 |
+
"15": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_",
|
31 |
+
"16": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_",
|
32 |
+
"17": "n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_",
|
33 |
+
"18": "n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat",
|
34 |
+
"19": "n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_",
|
35 |
+
"20": "n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_",
|
36 |
+
"21": "n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_",
|
37 |
+
"22": "n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_",
|
38 |
+
"23": "n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs",
|
39 |
+
"24": "n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_",
|
40 |
+
"25": "n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv",
|
41 |
+
"26": "n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur",
|
42 |
+
"27": "n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_",
|
43 |
+
"28": "n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs",
|
44 |
+
"29": "n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_",
|
45 |
+
"30": "n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_",
|
46 |
+
"31": "n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc",
|
47 |
+
"32": "n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_",
|
48 |
+
"33": "n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_",
|
49 |
+
"34": "n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_",
|
50 |
+
"35": "n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_",
|
51 |
+
"36": "n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_",
|
52 |
+
"37": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo",
|
53 |
+
"38": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc",
|
54 |
+
"39": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc",
|
55 |
+
"40": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_",
|
56 |
+
"41": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc",
|
57 |
+
"42": "n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_",
|
58 |
+
"43": "n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_",
|
59 |
+
"44": "n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_",
|
60 |
+
"45": "n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_",
|
61 |
+
"46": "n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf",
|
62 |
+
"47": "n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_",
|
63 |
+
"48": "n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_",
|
64 |
+
"49": "n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_",
|
65 |
+
"50": "n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_",
|
66 |
+
"51": "n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem",
|
67 |
+
"52": "n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_",
|
68 |
+
"53": "n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord",
|
69 |
+
"54": "n,\u6570\u8a5e,\u6570,*,NUM,_",
|
70 |
+
"55": "n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_",
|
71 |
+
"56": "p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_",
|
72 |
+
"57": "p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_",
|
73 |
+
"58": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_",
|
74 |
+
"59": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_",
|
75 |
+
"60": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_",
|
76 |
+
"61": "p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_",
|
77 |
+
"62": "p,\u611f\u5606\u8a5e,*,*,INTJ,_",
|
78 |
+
"63": "p,\u63a5\u5c3e\u8f9e,*,*,PART,_",
|
79 |
+
"64": "s,\u6587\u5b57,*,*,SYM,_",
|
80 |
+
"65": "s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_",
|
81 |
+
"66": "s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_",
|
82 |
+
"67": "s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_",
|
83 |
+
"68": "v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_",
|
84 |
+
"69": "v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_",
|
85 |
+
"70": "v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_",
|
86 |
+
"71": "v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_",
|
87 |
+
"72": "v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_",
|
88 |
+
"73": "v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_",
|
89 |
+
"74": "v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_",
|
90 |
+
"75": "v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg",
|
91 |
+
"76": "v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg",
|
92 |
+
"77": "v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg",
|
93 |
+
"78": "v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg",
|
94 |
+
"79": "v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_",
|
95 |
+
"80": "v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim",
|
96 |
+
"81": "v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf",
|
97 |
+
"82": "v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut",
|
98 |
+
"83": "v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim",
|
99 |
+
"84": "v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres",
|
100 |
+
"85": "v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim",
|
101 |
+
"86": "v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim",
|
102 |
+
"87": "v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim",
|
103 |
+
"88": "v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past",
|
104 |
+
"89": "v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau",
|
105 |
+
"90": "v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_",
|
106 |
+
"91": "v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_",
|
107 |
+
"92": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp",
|
108 |
+
"93": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup",
|
109 |
+
"94": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos",
|
110 |
+
"95": "v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_",
|
111 |
+
"96": "v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_",
|
112 |
+
"97": "v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_",
|
113 |
+
"98": "v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_",
|
114 |
+
"99": "v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_",
|
115 |
+
"100": "v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_",
|
116 |
+
"101": "v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass",
|
117 |
+
"102": "v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot",
|
118 |
+
"103": "v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec",
|
119 |
+
"104": "v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des",
|
120 |
+
"105": "v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_",
|
121 |
+
"106": "v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_",
|
122 |
+
"107": "v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_",
|
123 |
+
"108": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg",
|
124 |
+
"109": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop",
|
125 |
+
"110": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_",
|
126 |
+
"111": "v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos",
|
127 |
+
"112": "v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos",
|
128 |
+
"113": "v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos",
|
129 |
+
"114": "v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos",
|
130 |
+
"115": "v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_",
|
131 |
+
"116": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_",
|
132 |
+
"117": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_",
|
133 |
+
"118": "v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_",
|
134 |
+
"119": "v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ",
|
135 |
+
"120": "v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_",
|
136 |
+
"121": "v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_",
|
137 |
+
"122": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_",
|
138 |
+
"123": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_",
|
139 |
+
"124": "v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_",
|
140 |
+
"125": "v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_",
|
141 |
+
"126": "v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_",
|
142 |
+
"127": "v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_",
|
143 |
+
"128": "v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_"
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 3072,
|
147 |
"label2id": {
|
148 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs": 0,
|
149 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs": 1,
|
150 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs": 2,
|
151 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs": 3,
|
152 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes": 4,
|
153 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs": 5,
|
154 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs": 6,
|
155 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs": 7,
|
156 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs": 8,
|
157 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs": 9,
|
158 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs": 10,
|
159 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs": 11,
|
160 |
+
"n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem": 12,
|
161 |
+
"n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int": 13,
|
162 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_": 14,
|
163 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_": 15,
|
164 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_": 16,
|
165 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_": 17,
|
166 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat": 18,
|
167 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_": 19,
|
168 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_": 20,
|
169 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_": 21,
|
170 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_": 22,
|
171 |
+
"n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs": 23,
|
172 |
+
"n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_": 24,
|
173 |
+
"n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv": 25,
|
174 |
+
"n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur": 26,
|
175 |
+
"n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_": 27,
|
176 |
+
"n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs": 28,
|
177 |
+
"n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_": 29,
|
178 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_": 30,
|
179 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc": 31,
|
180 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_": 32,
|
181 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_": 33,
|
182 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_": 34,
|
183 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_": 35,
|
184 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_": 36,
|
185 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo": 37,
|
186 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc": 38,
|
187 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc": 39,
|
188 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_": 40,
|
189 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc": 41,
|
190 |
+
"n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_": 42,
|
191 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_": 43,
|
192 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_": 44,
|
193 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_": 45,
|
194 |
+
"n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf": 46,
|
195 |
+
"n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_": 47,
|
196 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_": 48,
|
197 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_": 49,
|
198 |
+
"n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_": 50,
|
199 |
+
"n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem": 51,
|
200 |
+
"n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_": 52,
|
201 |
+
"n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord": 53,
|
202 |
+
"n,\u6570\u8a5e,\u6570,*,NUM,_": 54,
|
203 |
+
"n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_": 55,
|
204 |
+
"p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_": 56,
|
205 |
+
"p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_": 57,
|
206 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_": 58,
|
207 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_": 59,
|
208 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_": 60,
|
209 |
+
"p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_": 61,
|
210 |
+
"p,\u611f\u5606\u8a5e,*,*,INTJ,_": 62,
|
211 |
+
"p,\u63a5\u5c3e\u8f9e,*,*,PART,_": 63,
|
212 |
+
"s,\u6587\u5b57,*,*,SYM,_": 64,
|
213 |
+
"s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_": 65,
|
214 |
+
"s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_": 66,
|
215 |
+
"s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_": 67,
|
216 |
+
"v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_": 68,
|
217 |
+
"v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_": 69,
|
218 |
+
"v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_": 70,
|
219 |
+
"v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_": 71,
|
220 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_": 72,
|
221 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_": 73,
|
222 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_": 74,
|
223 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg": 75,
|
224 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg": 76,
|
225 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg": 77,
|
226 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg": 78,
|
227 |
+
"v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_": 79,
|
228 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim": 80,
|
229 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf": 81,
|
230 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut": 82,
|
231 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim": 83,
|
232 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres": 84,
|
233 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim": 85,
|
234 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim": 86,
|
235 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim": 87,
|
236 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past": 88,
|
237 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau": 89,
|
238 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_": 90,
|
239 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_": 91,
|
240 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp": 92,
|
241 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup": 93,
|
242 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos": 94,
|
243 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_": 95,
|
244 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_": 96,
|
245 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_": 97,
|
246 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_": 98,
|
247 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_": 99,
|
248 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_": 100,
|
249 |
+
"v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass": 101,
|
250 |
+
"v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot": 102,
|
251 |
+
"v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec": 103,
|
252 |
+
"v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des": 104,
|
253 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_": 105,
|
254 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_": 106,
|
255 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_": 107,
|
256 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg": 108,
|
257 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop": 109,
|
258 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_": 110,
|
259 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos": 111,
|
260 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos": 112,
|
261 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos": 113,
|
262 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos": 114,
|
263 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_": 115,
|
264 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_": 116,
|
265 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_": 117,
|
266 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_": 118,
|
267 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ": 119,
|
268 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_": 120,
|
269 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_": 121,
|
270 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_": 122,
|
271 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_": 123,
|
272 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_": 124,
|
273 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_": 125,
|
274 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_": 126,
|
275 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_": 127,
|
276 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_": 128
|
277 |
},
|
278 |
"layer_norm_eps": 1e-12,
|
279 |
"max_position_embeddings": 512,
|
|
|
288 |
"pooler_type": "first_token_transform",
|
289 |
"position_embedding_type": "absolute",
|
290 |
"torch_dtype": "float32",
|
291 |
+
"transformers_version": "4.11.3",
|
292 |
"type_vocab_size": 2,
|
293 |
"use_cache": true,
|
294 |
"vocab_size": 29791
|
suparkanbun/models/sikubert.pos/filesize.txt
CHANGED
@@ -1,2 +1,2 @@
|
|
1 |
-
pytorch_model.bin
|
2 |
-
sikubert.supar
|
|
|
1 |
+
pytorch_model.bin 433804303
|
2 |
+
sikubert.supar 483333500
|
suparkanbun/models/sikubert.pos/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a719911302d7662426d2f3f2c8486b8de1a7a1afbe584fd9b1b1f8ea800b8a8d
|
3 |
+
size 433804303
|
suparkanbun/models/sikubert.pos/sikubert.supar
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bf74bf4c65a9101d5573d4736e93f9d0724258949e4cfd2ccc884bf302f1b27
|
3 |
+
size 483333500
|
suparkanbun/models/sikuroberta.danku/config.json
CHANGED
@@ -4,6 +4,7 @@
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
|
|
7 |
"directionality": "bidi",
|
8 |
"finetuning_task": "ner",
|
9 |
"gradient_checkpointing": false,
|
@@ -11,22 +12,22 @@
|
|
11 |
"hidden_dropout_prob": 0.1,
|
12 |
"hidden_size": 768,
|
13 |
"id2label": {
|
14 |
-
"0": "
|
15 |
-
"1": "
|
16 |
-
"2": "
|
17 |
-
"3": "
|
18 |
-
"4": "
|
19 |
-
"5": "
|
20 |
},
|
21 |
"initializer_range": 0.02,
|
22 |
"intermediate_size": 3072,
|
23 |
"label2id": {
|
24 |
-
"
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
},
|
31 |
"layer_norm_eps": 1e-12,
|
32 |
"max_position_embeddings": 512,
|
@@ -41,7 +42,7 @@
|
|
41 |
"pooler_type": "first_token_transform",
|
42 |
"position_embedding_type": "absolute",
|
43 |
"torch_dtype": "float32",
|
44 |
-
"transformers_version": "4.
|
45 |
"type_vocab_size": 2,
|
46 |
"use_cache": true,
|
47 |
"vocab_size": 29791
|
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
"directionality": "bidi",
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
+
"0": "B",
|
16 |
+
"1": "E",
|
17 |
+
"2": "E2",
|
18 |
+
"3": "E3",
|
19 |
+
"4": "M",
|
20 |
+
"5": "S"
|
21 |
},
|
22 |
"initializer_range": 0.02,
|
23 |
"intermediate_size": 3072,
|
24 |
"label2id": {
|
25 |
+
"B": 0,
|
26 |
+
"E": 1,
|
27 |
+
"E2": 2,
|
28 |
+
"E3": 3,
|
29 |
+
"M": 4,
|
30 |
+
"S": 5
|
31 |
},
|
32 |
"layer_norm_eps": 1e-12,
|
33 |
"max_position_embeddings": 512,
|
|
|
42 |
"pooler_type": "first_token_transform",
|
43 |
"position_embedding_type": "absolute",
|
44 |
"torch_dtype": "float32",
|
45 |
+
"transformers_version": "4.11.3",
|
46 |
"type_vocab_size": 2,
|
47 |
"use_cache": true,
|
48 |
"vocab_size": 29791
|
suparkanbun/models/sikuroberta.danku/filesize.txt
CHANGED
@@ -1 +1 @@
|
|
1 |
-
pytorch_model.bin
|
|
|
1 |
+
pytorch_model.bin 433425936
|
suparkanbun/models/sikuroberta.danku/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9362345a401390cd98600a8fddcb7f8d85e14ce5326c00a704d81881f92c45da
|
3 |
+
size 433425936
|
suparkanbun/models/sikuroberta.pos/config.json
CHANGED
@@ -4,6 +4,7 @@
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
|
|
7 |
"directionality": "bidi",
|
8 |
"finetuning_task": "ner",
|
9 |
"gradient_checkpointing": false,
|
@@ -11,268 +12,268 @@
|
|
11 |
"hidden_dropout_prob": 0.1,
|
12 |
"hidden_size": 768,
|
13 |
"id2label": {
|
14 |
-
"0": "n
|
15 |
-
"1": "n
|
16 |
-
"2": "n
|
17 |
-
"3": "n
|
18 |
-
"4": "n
|
19 |
-
"5": "n
|
20 |
-
"6": "n
|
21 |
-
"7": "n
|
22 |
-
"8": "n
|
23 |
-
"9": "n
|
24 |
-
"10": "n
|
25 |
-
"11": "n
|
26 |
-
"12": "n
|
27 |
-
"13": "n
|
28 |
-
"14": "n
|
29 |
-
"15": "n
|
30 |
-
"16": "n
|
31 |
-
"17": "n
|
32 |
-
"18": "n
|
33 |
-
"19": "n
|
34 |
-
"20": "n
|
35 |
-
"21": "n
|
36 |
-
"22": "n
|
37 |
-
"23": "n
|
38 |
-
"24": "n
|
39 |
-
"25": "n
|
40 |
-
"26": "n
|
41 |
-
"27": "n
|
42 |
-
"28": "n
|
43 |
-
"29": "n
|
44 |
-
"30": "n
|
45 |
-
"31": "n
|
46 |
-
"32": "n
|
47 |
-
"33": "n
|
48 |
-
"34": "n
|
49 |
-
"35": "n
|
50 |
-
"36": "n
|
51 |
-
"37": "n
|
52 |
-
"38": "n
|
53 |
-
"39": "n
|
54 |
-
"40": "n
|
55 |
-
"41": "n
|
56 |
-
"42": "n
|
57 |
-
"43": "n
|
58 |
-
"44": "n
|
59 |
-
"45": "n
|
60 |
-
"46": "n
|
61 |
-
"47": "n
|
62 |
-
"48": "n
|
63 |
-
"49": "n
|
64 |
-
"50": "n
|
65 |
-
"51": "n
|
66 |
-
"52": "n
|
67 |
-
"53": "n
|
68 |
-
"54": "n
|
69 |
-
"55": "n
|
70 |
-
"56": "p
|
71 |
-
"57": "p
|
72 |
-
"58": "p
|
73 |
-
"59": "p
|
74 |
-
"60": "p
|
75 |
-
"61": "p
|
76 |
-
"62": "p
|
77 |
-
"63": "p
|
78 |
-
"64": "s
|
79 |
-
"65": "s
|
80 |
-
"66": "s
|
81 |
-
"67": "s
|
82 |
-
"68": "v
|
83 |
-
"69": "v
|
84 |
-
"70": "v
|
85 |
-
"71": "v
|
86 |
-
"72": "v
|
87 |
-
"73": "v
|
88 |
-
"74": "v
|
89 |
-
"75": "v
|
90 |
-
"76": "v
|
91 |
-
"77": "v
|
92 |
-
"78": "v
|
93 |
-
"79": "v
|
94 |
-
"80": "v
|
95 |
-
"81": "v
|
96 |
-
"82": "v
|
97 |
-
"83": "v
|
98 |
-
"84": "v
|
99 |
-
"85": "v
|
100 |
-
"86": "v
|
101 |
-
"87": "v
|
102 |
-
"88": "v
|
103 |
-
"89": "v
|
104 |
-
"90": "v
|
105 |
-
"91": "v
|
106 |
-
"92": "v
|
107 |
-
"93": "v
|
108 |
-
"94": "v
|
109 |
-
"95": "v
|
110 |
-
"96": "v
|
111 |
-
"97": "v
|
112 |
-
"98": "v
|
113 |
-
"99": "v
|
114 |
-
"100": "v
|
115 |
-
"101": "v
|
116 |
-
"102": "v
|
117 |
-
"103": "v
|
118 |
-
"104": "v
|
119 |
-
"105": "v
|
120 |
-
"106": "v
|
121 |
-
"107": "v
|
122 |
-
"108": "v
|
123 |
-
"109": "v
|
124 |
-
"110": "v
|
125 |
-
"111": "v
|
126 |
-
"112": "v
|
127 |
-
"113": "v
|
128 |
-
"114": "v
|
129 |
-
"115": "v
|
130 |
-
"116": "v
|
131 |
-
"117": "v
|
132 |
-
"118": "v
|
133 |
-
"119": "v
|
134 |
-
"120": "v
|
135 |
-
"121": "v
|
136 |
-
"122": "v
|
137 |
-
"123": "v
|
138 |
-
"124": "v
|
139 |
-
"125": "v
|
140 |
-
"126": "v
|
141 |
-
"127": "v
|
142 |
-
"128": "v
|
143 |
},
|
144 |
"initializer_range": 0.02,
|
145 |
"intermediate_size": 3072,
|
146 |
"label2id": {
|
147 |
-
"n
|
148 |
-
"n
|
149 |
-
"n
|
150 |
-
"n
|
151 |
-
"n
|
152 |
-
"n
|
153 |
-
"n
|
154 |
-
"n
|
155 |
-
"n
|
156 |
-
"n
|
157 |
-
"n
|
158 |
-
"n
|
159 |
-
"n
|
160 |
-
"n
|
161 |
-
"n
|
162 |
-
"n
|
163 |
-
"n
|
164 |
-
"n
|
165 |
-
"n
|
166 |
-
"n
|
167 |
-
"n
|
168 |
-
"n
|
169 |
-
"n
|
170 |
-
"n
|
171 |
-
"n
|
172 |
-
"n
|
173 |
-
"n
|
174 |
-
"n
|
175 |
-
"n
|
176 |
-
"n
|
177 |
-
"n
|
178 |
-
"n
|
179 |
-
"n
|
180 |
-
"n
|
181 |
-
"n
|
182 |
-
"n
|
183 |
-
"n
|
184 |
-
"n
|
185 |
-
"n
|
186 |
-
"n
|
187 |
-
"n
|
188 |
-
"n
|
189 |
-
"n
|
190 |
-
"n
|
191 |
-
"n
|
192 |
-
"n
|
193 |
-
"n
|
194 |
-
"n
|
195 |
-
"n
|
196 |
-
"n
|
197 |
-
"n
|
198 |
-
"n
|
199 |
-
"n
|
200 |
-
"n
|
201 |
-
"n
|
202 |
-
"n
|
203 |
-
"p
|
204 |
-
"p
|
205 |
-
"p
|
206 |
-
"p
|
207 |
-
"p
|
208 |
-
"p
|
209 |
-
"p
|
210 |
-
"p
|
211 |
-
"s
|
212 |
-
"s
|
213 |
-
"s
|
214 |
-
"s
|
215 |
-
"v
|
216 |
-
"v
|
217 |
-
"v
|
218 |
-
"v
|
219 |
-
"v
|
220 |
-
"v
|
221 |
-
"v
|
222 |
-
"v
|
223 |
-
"v
|
224 |
-
"v
|
225 |
-
"v
|
226 |
-
"v
|
227 |
-
"v
|
228 |
-
"v
|
229 |
-
"v
|
230 |
-
"v
|
231 |
-
"v
|
232 |
-
"v
|
233 |
-
"v
|
234 |
-
"v
|
235 |
-
"v
|
236 |
-
"v
|
237 |
-
"v
|
238 |
-
"v
|
239 |
-
"v
|
240 |
-
"v
|
241 |
-
"v
|
242 |
-
"v
|
243 |
-
"v
|
244 |
-
"v
|
245 |
-
"v
|
246 |
-
"v
|
247 |
-
"v
|
248 |
-
"v
|
249 |
-
"v
|
250 |
-
"v
|
251 |
-
"v
|
252 |
-
"v
|
253 |
-
"v
|
254 |
-
"v
|
255 |
-
"v
|
256 |
-
"v
|
257 |
-
"v
|
258 |
-
"v
|
259 |
-
"v
|
260 |
-
"v
|
261 |
-
"v
|
262 |
-
"v
|
263 |
-
"v
|
264 |
-
"v
|
265 |
-
"v
|
266 |
-
"v
|
267 |
-
"v
|
268 |
-
"v
|
269 |
-
"v
|
270 |
-
"v
|
271 |
-
"v
|
272 |
-
"v
|
273 |
-
"v
|
274 |
-
"v
|
275 |
-
"v
|
276 |
},
|
277 |
"layer_norm_eps": 1e-12,
|
278 |
"max_position_embeddings": 512,
|
@@ -287,7 +288,7 @@
|
|
287 |
"pooler_type": "first_token_transform",
|
288 |
"position_embedding_type": "absolute",
|
289 |
"torch_dtype": "float32",
|
290 |
-
"transformers_version": "4.
|
291 |
"type_vocab_size": 2,
|
292 |
"use_cache": true,
|
293 |
"vocab_size": 29791
|
|
|
4 |
"BertForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
"directionality": "bidi",
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
+
"0": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs",
|
16 |
+
"1": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs",
|
17 |
+
"2": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs",
|
18 |
+
"3": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs",
|
19 |
+
"4": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes",
|
20 |
+
"5": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs",
|
21 |
+
"6": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs",
|
22 |
+
"7": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs",
|
23 |
+
"8": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs",
|
24 |
+
"9": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs",
|
25 |
+
"10": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs",
|
26 |
+
"11": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs",
|
27 |
+
"12": "n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem",
|
28 |
+
"13": "n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int",
|
29 |
+
"14": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_",
|
30 |
+
"15": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_",
|
31 |
+
"16": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_",
|
32 |
+
"17": "n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_",
|
33 |
+
"18": "n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat",
|
34 |
+
"19": "n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_",
|
35 |
+
"20": "n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_",
|
36 |
+
"21": "n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_",
|
37 |
+
"22": "n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_",
|
38 |
+
"23": "n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs",
|
39 |
+
"24": "n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_",
|
40 |
+
"25": "n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv",
|
41 |
+
"26": "n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur",
|
42 |
+
"27": "n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_",
|
43 |
+
"28": "n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs",
|
44 |
+
"29": "n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_",
|
45 |
+
"30": "n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_",
|
46 |
+
"31": "n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc",
|
47 |
+
"32": "n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_",
|
48 |
+
"33": "n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_",
|
49 |
+
"34": "n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_",
|
50 |
+
"35": "n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_",
|
51 |
+
"36": "n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_",
|
52 |
+
"37": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo",
|
53 |
+
"38": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc",
|
54 |
+
"39": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc",
|
55 |
+
"40": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_",
|
56 |
+
"41": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc",
|
57 |
+
"42": "n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_",
|
58 |
+
"43": "n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_",
|
59 |
+
"44": "n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_",
|
60 |
+
"45": "n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_",
|
61 |
+
"46": "n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf",
|
62 |
+
"47": "n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_",
|
63 |
+
"48": "n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_",
|
64 |
+
"49": "n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_",
|
65 |
+
"50": "n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_",
|
66 |
+
"51": "n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem",
|
67 |
+
"52": "n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_",
|
68 |
+
"53": "n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord",
|
69 |
+
"54": "n,\u6570\u8a5e,\u6570,*,NUM,_",
|
70 |
+
"55": "n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_",
|
71 |
+
"56": "p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_",
|
72 |
+
"57": "p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_",
|
73 |
+
"58": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_",
|
74 |
+
"59": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_",
|
75 |
+
"60": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_",
|
76 |
+
"61": "p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_",
|
77 |
+
"62": "p,\u611f\u5606\u8a5e,*,*,INTJ,_",
|
78 |
+
"63": "p,\u63a5\u5c3e\u8f9e,*,*,PART,_",
|
79 |
+
"64": "s,\u6587\u5b57,*,*,SYM,_",
|
80 |
+
"65": "s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_",
|
81 |
+
"66": "s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_",
|
82 |
+
"67": "s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_",
|
83 |
+
"68": "v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_",
|
84 |
+
"69": "v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_",
|
85 |
+
"70": "v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_",
|
86 |
+
"71": "v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_",
|
87 |
+
"72": "v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_",
|
88 |
+
"73": "v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_",
|
89 |
+
"74": "v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_",
|
90 |
+
"75": "v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg",
|
91 |
+
"76": "v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg",
|
92 |
+
"77": "v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg",
|
93 |
+
"78": "v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg",
|
94 |
+
"79": "v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_",
|
95 |
+
"80": "v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim",
|
96 |
+
"81": "v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf",
|
97 |
+
"82": "v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut",
|
98 |
+
"83": "v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim",
|
99 |
+
"84": "v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres",
|
100 |
+
"85": "v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim",
|
101 |
+
"86": "v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim",
|
102 |
+
"87": "v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim",
|
103 |
+
"88": "v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past",
|
104 |
+
"89": "v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau",
|
105 |
+
"90": "v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_",
|
106 |
+
"91": "v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_",
|
107 |
+
"92": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp",
|
108 |
+
"93": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup",
|
109 |
+
"94": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos",
|
110 |
+
"95": "v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_",
|
111 |
+
"96": "v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_",
|
112 |
+
"97": "v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_",
|
113 |
+
"98": "v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_",
|
114 |
+
"99": "v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_",
|
115 |
+
"100": "v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_",
|
116 |
+
"101": "v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass",
|
117 |
+
"102": "v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot",
|
118 |
+
"103": "v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec",
|
119 |
+
"104": "v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des",
|
120 |
+
"105": "v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_",
|
121 |
+
"106": "v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_",
|
122 |
+
"107": "v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_",
|
123 |
+
"108": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg",
|
124 |
+
"109": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop",
|
125 |
+
"110": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_",
|
126 |
+
"111": "v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos",
|
127 |
+
"112": "v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos",
|
128 |
+
"113": "v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos",
|
129 |
+
"114": "v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos",
|
130 |
+
"115": "v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_",
|
131 |
+
"116": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_",
|
132 |
+
"117": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_",
|
133 |
+
"118": "v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_",
|
134 |
+
"119": "v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ",
|
135 |
+
"120": "v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_",
|
136 |
+
"121": "v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_",
|
137 |
+
"122": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_",
|
138 |
+
"123": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_",
|
139 |
+
"124": "v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_",
|
140 |
+
"125": "v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_",
|
141 |
+
"126": "v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_",
|
142 |
+
"127": "v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_",
|
143 |
+
"128": "v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_"
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 3072,
|
147 |
"label2id": {
|
148 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs": 0,
|
149 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs": 1,
|
150 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs": 2,
|
151 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs": 3,
|
152 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes": 4,
|
153 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs": 5,
|
154 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs": 6,
|
155 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs": 7,
|
156 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs": 8,
|
157 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs": 9,
|
158 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs": 10,
|
159 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs": 11,
|
160 |
+
"n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem": 12,
|
161 |
+
"n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int": 13,
|
162 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_": 14,
|
163 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_": 15,
|
164 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_": 16,
|
165 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_": 17,
|
166 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat": 18,
|
167 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_": 19,
|
168 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_": 20,
|
169 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_": 21,
|
170 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_": 22,
|
171 |
+
"n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs": 23,
|
172 |
+
"n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_": 24,
|
173 |
+
"n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv": 25,
|
174 |
+
"n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur": 26,
|
175 |
+
"n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_": 27,
|
176 |
+
"n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs": 28,
|
177 |
+
"n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_": 29,
|
178 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_": 30,
|
179 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc": 31,
|
180 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_": 32,
|
181 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_": 33,
|
182 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_": 34,
|
183 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_": 35,
|
184 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_": 36,
|
185 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo": 37,
|
186 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc": 38,
|
187 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc": 39,
|
188 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_": 40,
|
189 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc": 41,
|
190 |
+
"n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_": 42,
|
191 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_": 43,
|
192 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_": 44,
|
193 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_": 45,
|
194 |
+
"n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf": 46,
|
195 |
+
"n,\u540d\u8a5e,\u601d\u8003,*,NOUN,_": 47,
|
196 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_": 48,
|
197 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_": 49,
|
198 |
+
"n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_": 50,
|
199 |
+
"n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem": 51,
|
200 |
+
"n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_": 52,
|
201 |
+
"n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord": 53,
|
202 |
+
"n,\u6570\u8a5e,\u6570,*,NUM,_": 54,
|
203 |
+
"n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_": 55,
|
204 |
+
"p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_": 56,
|
205 |
+
"p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_": 57,
|
206 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_": 58,
|
207 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_": 59,
|
208 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_": 60,
|
209 |
+
"p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_": 61,
|
210 |
+
"p,\u611f\u5606\u8a5e,*,*,INTJ,_": 62,
|
211 |
+
"p,\u63a5\u5c3e\u8f9e,*,*,PART,_": 63,
|
212 |
+
"s,\u6587\u5b57,*,*,SYM,_": 64,
|
213 |
+
"s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_": 65,
|
214 |
+
"s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_": 66,
|
215 |
+
"s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_": 67,
|
216 |
+
"v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_": 68,
|
217 |
+
"v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_": 69,
|
218 |
+
"v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_": 70,
|
219 |
+
"v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_": 71,
|
220 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_": 72,
|
221 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_": 73,
|
222 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_": 74,
|
223 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg": 75,
|
224 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg": 76,
|
225 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg": 77,
|
226 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg": 78,
|
227 |
+
"v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_": 79,
|
228 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim": 80,
|
229 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf": 81,
|
230 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut": 82,
|
231 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim": 83,
|
232 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres": 84,
|
233 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim": 85,
|
234 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim": 86,
|
235 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim": 87,
|
236 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past": 88,
|
237 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau": 89,
|
238 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_": 90,
|
239 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_": 91,
|
240 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp": 92,
|
241 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup": 93,
|
242 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos": 94,
|
243 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_": 95,
|
244 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_": 96,
|
245 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_": 97,
|
246 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_": 98,
|
247 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_": 99,
|
248 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_": 100,
|
249 |
+
"v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass": 101,
|
250 |
+
"v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot": 102,
|
251 |
+
"v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec": 103,
|
252 |
+
"v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des": 104,
|
253 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_": 105,
|
254 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_": 106,
|
255 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_": 107,
|
256 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg": 108,
|
257 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop": 109,
|
258 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_": 110,
|
259 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos": 111,
|
260 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos": 112,
|
261 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos": 113,
|
262 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos": 114,
|
263 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_": 115,
|
264 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_": 116,
|
265 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_": 117,
|
266 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_": 118,
|
267 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ": 119,
|
268 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_": 120,
|
269 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_": 121,
|
270 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_": 122,
|
271 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_": 123,
|
272 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_": 124,
|
273 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_": 125,
|
274 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_": 126,
|
275 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_": 127,
|
276 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_": 128
|
277 |
},
|
278 |
"layer_norm_eps": 1e-12,
|
279 |
"max_position_embeddings": 512,
|
|
|
288 |
"pooler_type": "first_token_transform",
|
289 |
"position_embedding_type": "absolute",
|
290 |
"torch_dtype": "float32",
|
291 |
+
"transformers_version": "4.11.3",
|
292 |
"type_vocab_size": 2,
|
293 |
"use_cache": true,
|
294 |
"vocab_size": 29791
|
suparkanbun/models/sikuroberta.pos/filesize.txt
CHANGED
@@ -1,2 +1,2 @@
|
|
1 |
-
pytorch_model.bin
|
2 |
-
sikuroberta.supar
|
|
|
1 |
+
pytorch_model.bin 433804373
|
2 |
+
sikuroberta.supar 483333519
|
suparkanbun/models/sikuroberta.pos/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c9825e59cb4e096f9a75a103a516fdc64d6758e5c4f5928f70b22f0c7e08a69
|
3 |
+
size 433804373
|
suparkanbun/models/sikuroberta.pos/sikuroberta.supar
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7828222a4aafd7b3f99f5b0a5830f2d95b32bbc2dcaff685e7b413af1369ba4a
|
3 |
+
size 483333519
|