KoichiYasuoka
committed on
Commit
•
5fba8e3
1
Parent(s):
b975e76
model improved
Browse files
- config.json +262 -260
- pytorch_model.bin +2 -2
- suparkanbun/models/labelPOS.txt +3 -2
- suparkanbun/models/lzh_kyoto.conllu +2 -2
- tokenizer_config.json +1 -1
config.json
CHANGED
@@ -1,10 +1,10 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "KoichiYasuoka/roberta-classical-chinese-base-char",
|
3 |
"architectures": [
|
4 |
"RobertaForTokenClassification"
|
5 |
],
|
6 |
"attention_probs_dropout_prob": 0.1,
|
7 |
"bos_token_id": 0,
|
|
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
@@ -12,268 +12,270 @@
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
-
"0": "n
|
16 |
-
"1": "n
|
17 |
-
"2": "n
|
18 |
-
"3": "n
|
19 |
-
"4": "n
|
20 |
-
"5": "n
|
21 |
-
"6": "n
|
22 |
-
"7": "n
|
23 |
-
"8": "n
|
24 |
-
"9": "n
|
25 |
-
"10": "n
|
26 |
-
"11": "n
|
27 |
-
"12": "n
|
28 |
-
"13": "n
|
29 |
-
"14": "n
|
30 |
-
"15": "n
|
31 |
-
"16": "n
|
32 |
-
"17": "n
|
33 |
-
"18": "n
|
34 |
-
"19": "n
|
35 |
-
"20": "n
|
36 |
-
"21": "n
|
37 |
-
"22": "n
|
38 |
-
"23": "n
|
39 |
-
"24": "n
|
40 |
-
"25": "n
|
41 |
-
"26": "n
|
42 |
-
"27": "n
|
43 |
-
"28": "n
|
44 |
-
"29": "n
|
45 |
-
"30": "n
|
46 |
-
"31": "n
|
47 |
-
"32": "n
|
48 |
-
"33": "n
|
49 |
-
"34": "n
|
50 |
-
"35": "n
|
51 |
-
"36": "n
|
52 |
-
"37": "n
|
53 |
-
"38": "n
|
54 |
-
"39": "n
|
55 |
-
"40": "n
|
56 |
-
"41": "n
|
57 |
-
"42": "n
|
58 |
-
"43": "n
|
59 |
-
"44": "n
|
60 |
-
"45": "n
|
61 |
-
"46": "n
|
62 |
-
"47": "n
|
63 |
-
"48": "n
|
64 |
-
"49": "n
|
65 |
-
"50": "n
|
66 |
-
"51": "n
|
67 |
-
"52": "n
|
68 |
-
"53": "n
|
69 |
-
"54": "n
|
70 |
-
"55": "n
|
71 |
-
"56": "
|
72 |
-
"57": "p
|
73 |
-
"58": "p
|
74 |
-
"59": "p
|
75 |
-
"60": "p
|
76 |
-
"61": "p
|
77 |
-
"62": "p
|
78 |
-
"63": "p
|
79 |
-
"64": "
|
80 |
-
"65": "s
|
81 |
-
"66": "s
|
82 |
-
"67": "s
|
83 |
-
"68": "
|
84 |
-
"69": "v
|
85 |
-
"70": "v
|
86 |
-
"71": "v
|
87 |
-
"72": "v
|
88 |
-
"73": "v
|
89 |
-
"74": "v
|
90 |
-
"75": "v
|
91 |
-
"76": "v
|
92 |
-
"77": "v
|
93 |
-
"78": "v
|
94 |
-
"79": "v
|
95 |
-
"80": "v
|
96 |
-
"81": "v
|
97 |
-
"82": "v
|
98 |
-
"83": "v
|
99 |
-
"84": "v
|
100 |
-
"85": "v
|
101 |
-
"86": "v
|
102 |
-
"87": "v
|
103 |
-
"88": "v
|
104 |
-
"89": "v
|
105 |
-
"90": "v
|
106 |
-
"91": "v
|
107 |
-
"92": "v
|
108 |
-
"93": "v
|
109 |
-
"94": "v
|
110 |
-
"95": "v
|
111 |
-
"96": "v
|
112 |
-
"97": "v
|
113 |
-
"98": "v
|
114 |
-
"99": "v
|
115 |
-
"100": "v
|
116 |
-
"101": "v
|
117 |
-
"102": "v
|
118 |
-
"103": "v
|
119 |
-
"104": "v
|
120 |
-
"105": "v
|
121 |
-
"106": "v
|
122 |
-
"107": "v
|
123 |
-
"108": "v
|
124 |
-
"109": "v
|
125 |
-
"110": "v
|
126 |
-
"111": "v
|
127 |
-
"112": "v
|
128 |
-
"113": "v
|
129 |
-
"114": "v
|
130 |
-
"115": "v
|
131 |
-
"116": "v
|
132 |
-
"117": "v
|
133 |
-
"118": "v
|
134 |
-
"119": "v
|
135 |
-
"120": "v
|
136 |
-
"121": "v
|
137 |
-
"122": "v
|
138 |
-
"123": "v
|
139 |
-
"124": "v
|
140 |
-
"125": "v
|
141 |
-
"126": "v
|
142 |
-
"127": "v
|
143 |
-
"128": "v
|
|
|
144 |
},
|
145 |
"initializer_range": 0.02,
|
146 |
"intermediate_size": 3072,
|
147 |
"label2id": {
|
148 |
-
"n
|
149 |
-
"n
|
150 |
-
"n
|
151 |
-
"n
|
152 |
-
"n
|
153 |
-
"n
|
154 |
-
"n
|
155 |
-
"n
|
156 |
-
"n
|
157 |
-
"n
|
158 |
-
"n
|
159 |
-
"n
|
160 |
-
"n
|
161 |
-
"n
|
162 |
-
"n
|
163 |
-
"n
|
164 |
-
"n
|
165 |
-
"n
|
166 |
-
"n
|
167 |
-
"n
|
168 |
-
"n
|
169 |
-
"n
|
170 |
-
"n
|
171 |
-
"n
|
172 |
-
"n
|
173 |
-
"n
|
174 |
-
"n
|
175 |
-
"n
|
176 |
-
"n
|
177 |
-
"n
|
178 |
-
"n
|
179 |
-
"n
|
180 |
-
"n
|
181 |
-
"n
|
182 |
-
"n
|
183 |
-
"n
|
184 |
-
"n
|
185 |
-
"n
|
186 |
-
"n
|
187 |
-
"n
|
188 |
-
"n
|
189 |
-
"n
|
190 |
-
"n
|
191 |
-
"n
|
192 |
-
"n
|
193 |
-
"n
|
194 |
-
"n
|
195 |
-
"n
|
196 |
-
"n
|
197 |
-
"n
|
198 |
-
"n
|
199 |
-
"n
|
200 |
-
"n
|
201 |
-
"n
|
202 |
-
"n
|
203 |
-
"n
|
204 |
-
"
|
205 |
-
"p
|
206 |
-
"p
|
207 |
-
"p
|
208 |
-
"p
|
209 |
-
"p
|
210 |
-
"p
|
211 |
-
"p
|
212 |
-
"
|
213 |
-
"s
|
214 |
-
"s
|
215 |
-
"s
|
216 |
-
"
|
217 |
-
"v
|
218 |
-
"v
|
219 |
-
"v
|
220 |
-
"v
|
221 |
-
"v
|
222 |
-
"v
|
223 |
-
"v
|
224 |
-
"v
|
225 |
-
"v
|
226 |
-
"v
|
227 |
-
"v
|
228 |
-
"v
|
229 |
-
"v
|
230 |
-
"v
|
231 |
-
"v
|
232 |
-
"v
|
233 |
-
"v
|
234 |
-
"v
|
235 |
-
"v
|
236 |
-
"v
|
237 |
-
"v
|
238 |
-
"v
|
239 |
-
"v
|
240 |
-
"v
|
241 |
-
"v
|
242 |
-
"v
|
243 |
-
"v
|
244 |
-
"v
|
245 |
-
"v
|
246 |
-
"v
|
247 |
-
"v
|
248 |
-
"v
|
249 |
-
"v
|
250 |
-
"v
|
251 |
-
"v
|
252 |
-
"v
|
253 |
-
"v
|
254 |
-
"v
|
255 |
-
"v
|
256 |
-
"v
|
257 |
-
"v
|
258 |
-
"v
|
259 |
-
"v
|
260 |
-
"v
|
261 |
-
"v
|
262 |
-
"v
|
263 |
-
"v
|
264 |
-
"v
|
265 |
-
"v
|
266 |
-
"v
|
267 |
-
"v
|
268 |
-
"v
|
269 |
-
"v
|
270 |
-
"v
|
271 |
-
"v
|
272 |
-
"v
|
273 |
-
"v
|
274 |
-
"v
|
275 |
-
"v
|
276 |
-
"v
|
|
|
277 |
},
|
278 |
"layer_norm_eps": 1e-05,
|
279 |
"max_position_embeddings": 514,
|
@@ -284,7 +286,7 @@
|
|
284 |
"position_embedding_type": "absolute",
|
285 |
"tokenizer_class": "BertTokenizer",
|
286 |
"torch_dtype": "float32",
|
287 |
-
"transformers_version": "4.
|
288 |
"type_vocab_size": 1,
|
289 |
"use_cache": true,
|
290 |
"vocab_size": 26318
|
|
|
1 |
{
|
|
|
2 |
"architectures": [
|
3 |
"RobertaForTokenClassification"
|
4 |
],
|
5 |
"attention_probs_dropout_prob": 0.1,
|
6 |
"bos_token_id": 0,
|
7 |
+
"classifier_dropout": null,
|
8 |
"eos_token_id": 2,
|
9 |
"finetuning_task": "ner",
|
10 |
"gradient_checkpointing": false,
|
|
|
12 |
"hidden_dropout_prob": 0.1,
|
13 |
"hidden_size": 768,
|
14 |
"id2label": {
|
15 |
+
"0": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs",
|
16 |
+
"1": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs",
|
17 |
+
"2": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs",
|
18 |
+
"3": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs",
|
19 |
+
"4": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes",
|
20 |
+
"5": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs",
|
21 |
+
"6": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs",
|
22 |
+
"7": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs",
|
23 |
+
"8": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs",
|
24 |
+
"9": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs",
|
25 |
+
"10": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs",
|
26 |
+
"11": "n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs",
|
27 |
+
"12": "n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem",
|
28 |
+
"13": "n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int",
|
29 |
+
"14": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_",
|
30 |
+
"15": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_",
|
31 |
+
"16": "n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_",
|
32 |
+
"17": "n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_",
|
33 |
+
"18": "n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat",
|
34 |
+
"19": "n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_",
|
35 |
+
"20": "n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_",
|
36 |
+
"21": "n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_",
|
37 |
+
"22": "n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_",
|
38 |
+
"23": "n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs",
|
39 |
+
"24": "n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_",
|
40 |
+
"25": "n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv",
|
41 |
+
"26": "n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur",
|
42 |
+
"27": "n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_",
|
43 |
+
"28": "n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs",
|
44 |
+
"29": "n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_",
|
45 |
+
"30": "n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_",
|
46 |
+
"31": "n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc",
|
47 |
+
"32": "n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_",
|
48 |
+
"33": "n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_",
|
49 |
+
"34": "n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_",
|
50 |
+
"35": "n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_",
|
51 |
+
"36": "n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_",
|
52 |
+
"37": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo",
|
53 |
+
"38": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc",
|
54 |
+
"39": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc",
|
55 |
+
"40": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_",
|
56 |
+
"41": "n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc",
|
57 |
+
"42": "n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_",
|
58 |
+
"43": "n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_",
|
59 |
+
"44": "n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_",
|
60 |
+
"45": "n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_",
|
61 |
+
"46": "n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf",
|
62 |
+
"47": "n,\u540d\u8a5e,\u601d\u8003,\u601d\u8003,NOUN,_",
|
63 |
+
"48": "n,\u540d\u8a5e,\u601d\u8003,\u65b9\u7565,NOUN,_",
|
64 |
+
"49": "n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_",
|
65 |
+
"50": "n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_",
|
66 |
+
"51": "n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_",
|
67 |
+
"52": "n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem",
|
68 |
+
"53": "n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_",
|
69 |
+
"54": "n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord",
|
70 |
+
"55": "n,\u6570\u8a5e,\u6570,*,NUM,_",
|
71 |
+
"56": "n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_",
|
72 |
+
"57": "p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_",
|
73 |
+
"58": "p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_",
|
74 |
+
"59": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_",
|
75 |
+
"60": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_",
|
76 |
+
"61": "p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_",
|
77 |
+
"62": "p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_",
|
78 |
+
"63": "p,\u611f\u5606\u8a5e,*,*,INTJ,_",
|
79 |
+
"64": "p,\u63a5\u5c3e\u8f9e,*,*,PART,_",
|
80 |
+
"65": "s,\u6587\u5b57,*,*,SYM,_",
|
81 |
+
"66": "s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_",
|
82 |
+
"67": "s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_",
|
83 |
+
"68": "s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_",
|
84 |
+
"69": "v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_",
|
85 |
+
"70": "v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_",
|
86 |
+
"71": "v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_",
|
87 |
+
"72": "v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_",
|
88 |
+
"73": "v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_",
|
89 |
+
"74": "v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_",
|
90 |
+
"75": "v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_",
|
91 |
+
"76": "v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg",
|
92 |
+
"77": "v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg",
|
93 |
+
"78": "v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg",
|
94 |
+
"79": "v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg",
|
95 |
+
"80": "v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_",
|
96 |
+
"81": "v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim",
|
97 |
+
"82": "v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf",
|
98 |
+
"83": "v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut",
|
99 |
+
"84": "v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim",
|
100 |
+
"85": "v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres",
|
101 |
+
"86": "v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim",
|
102 |
+
"87": "v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim",
|
103 |
+
"88": "v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim",
|
104 |
+
"89": "v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past",
|
105 |
+
"90": "v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau",
|
106 |
+
"91": "v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_",
|
107 |
+
"92": "v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_",
|
108 |
+
"93": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp",
|
109 |
+
"94": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup",
|
110 |
+
"95": "v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos",
|
111 |
+
"96": "v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_",
|
112 |
+
"97": "v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_",
|
113 |
+
"98": "v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_",
|
114 |
+
"99": "v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_",
|
115 |
+
"100": "v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_",
|
116 |
+
"101": "v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_",
|
117 |
+
"102": "v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass",
|
118 |
+
"103": "v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot",
|
119 |
+
"104": "v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec",
|
120 |
+
"105": "v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des",
|
121 |
+
"106": "v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_",
|
122 |
+
"107": "v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_",
|
123 |
+
"108": "v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_",
|
124 |
+
"109": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg",
|
125 |
+
"110": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop",
|
126 |
+
"111": "v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_",
|
127 |
+
"112": "v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos",
|
128 |
+
"113": "v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos",
|
129 |
+
"114": "v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos",
|
130 |
+
"115": "v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos",
|
131 |
+
"116": "v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_",
|
132 |
+
"117": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_",
|
133 |
+
"118": "v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_",
|
134 |
+
"119": "v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_",
|
135 |
+
"120": "v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ",
|
136 |
+
"121": "v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_",
|
137 |
+
"122": "v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_",
|
138 |
+
"123": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_",
|
139 |
+
"124": "v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_",
|
140 |
+
"125": "v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_",
|
141 |
+
"126": "v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_",
|
142 |
+
"127": "v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_",
|
143 |
+
"128": "v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_",
|
144 |
+
"129": "v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_"
|
145 |
},
|
146 |
"initializer_range": 0.02,
|
147 |
"intermediate_size": 3072,
|
148 |
"label2id": {
|
149 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=1|PronType=Prs": 0,
|
150 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=2|PronType=Prs": 1,
|
151 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,Person=3|PronType=Prs": 2,
|
152 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs": 3,
|
153 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u4ed6,PRON,PronType=Prs|Reflex=Yes": 4,
|
154 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=1|PronType=Prs": 5,
|
155 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=2|PronType=Prs": 6,
|
156 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u6b62\u683c,PRON,Person=3|PronType=Prs": 7,
|
157 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=1|PronType=Prs": 8,
|
158 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=2|PronType=Prs": 9,
|
159 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,Person=3|PronType=Prs": 10,
|
160 |
+
"n,\u4ee3\u540d\u8a5e,\u4eba\u79f0,\u8d77\u683c,PRON,PronType=Prs": 11,
|
161 |
+
"n,\u4ee3\u540d\u8a5e,\u6307\u793a,*,PRON,PronType=Dem": 12,
|
162 |
+
"n,\u4ee3\u540d\u8a5e,\u7591\u554f,*,PRON,PronType=Int": 13,
|
163 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u5c5e\u6027,NOUN,_": 14,
|
164 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u75be\u75c5,NOUN,_": 15,
|
165 |
+
"n,\u540d\u8a5e,\u4e0d\u53ef\u8b72,\u8eab\u4f53,NOUN,_": 16,
|
166 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u52d5\u7269,NOUN,_": 17,
|
167 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u56fd\u540d,PROPN,Case=Loc|NameType=Nat": 18,
|
168 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u66f8\u7269,NOUN,_": 19,
|
169 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u6a5f\u95a2,NOUN,_": 20,
|
170 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u795e\u4ecf,NOUN,_": 21,
|
171 |
+
"n,\u540d\u8a5e,\u4e3b\u4f53,\u96c6\u56e3,NOUN,_": 22,
|
172 |
+
"n,\u540d\u8a5e,\u4eba,\u305d\u306e\u4ed6\u306e\u4eba\u540d,PROPN,NameType=Prs": 23,
|
173 |
+
"n,\u540d\u8a5e,\u4eba,\u4eba,NOUN,_": 24,
|
174 |
+
"n,\u540d\u8a5e,\u4eba,\u540d,PROPN,NameType=Giv": 25,
|
175 |
+
"n,\u540d\u8a5e,\u4eba,\u59d3\u6c0f,PROPN,NameType=Sur": 26,
|
176 |
+
"n,\u540d\u8a5e,\u4eba,\u5f79\u5272,NOUN,_": 27,
|
177 |
+
"n,\u540d\u8a5e,\u4eba,\u8907\u5408\u7684\u4eba\u540d,PROPN,NameType=Prs": 28,
|
178 |
+
"n,\u540d\u8a5e,\u4eba,\u95a2\u4fc2,NOUN,_": 29,
|
179 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5100\u793c,NOUN,_": 30,
|
180 |
+
"n,\u540d\u8a5e,\u5236\u5ea6,\u5834,NOUN,Case=Loc": 31,
|
181 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4e57\u308a\u7269,NOUN,_": 32,
|
182 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u4f1d\u9054,NOUN,_": 33,
|
183 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u6210\u679c\u7269,NOUN,_": 34,
|
184 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u7ce7\u98df,NOUN,_": 35,
|
185 |
+
"n,\u540d\u8a5e,\u53ef\u642c,\u9053\u5177,NOUN,_": 36,
|
186 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u540d,PROPN,Case=Loc|NameType=Geo": 37,
|
187 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5730\u5f62,NOUN,Case=Loc": 38,
|
188 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u5efa\u9020\u7269,NOUN,Case=Loc": 39,
|
189 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u6a39\u6728,NOUN,_": 40,
|
190 |
+
"n,\u540d\u8a5e,\u56fa\u5b9a\u7269,\u95a2\u4fc2,NOUN,Case=Loc": 41,
|
191 |
+
"n,\u540d\u8a5e,\u5916\u89b3,\u4eba,NOUN,_": 42,
|
192 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u5929\u6587,NOUN,_": 43,
|
193 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u602a\u7570,NOUN,_": 44,
|
194 |
+
"n,\u540d\u8a5e,\u5929\u8c61,\u6c17\u8c61,NOUN,_": 45,
|
195 |
+
"n,\u540d\u8a5e,\u5ea6\u91cf\u8861,*,NOUN,NounType=Clf": 46,
|
196 |
+
"n,\u540d\u8a5e,\u601d\u8003,\u601d\u8003,NOUN,_": 47,
|
197 |
+
"n,\u540d\u8a5e,\u601d\u8003,\u65b9\u7565,NOUN,_": 48,
|
198 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u5f62\u8cea,NOUN,_": 49,
|
199 |
+
"n,\u540d\u8a5e,\u63cf\u5199,\u614b\u5ea6,NOUN,_": 50,
|
200 |
+
"n,\u540d\u8a5e,\u6570\u91cf,*,NOUN,_": 51,
|
201 |
+
"n,\u540d\u8a5e,\u6642,*,NOUN,Case=Tem": 52,
|
202 |
+
"n,\u540d\u8a5e,\u884c\u70ba,*,NOUN,_": 53,
|
203 |
+
"n,\u6570\u8a5e,\u5e72\u652f,*,NUM,NumType=Ord": 54,
|
204 |
+
"n,\u6570\u8a5e,\u6570,*,NUM,_": 55,
|
205 |
+
"n,\u6570\u8a5e,\u6570\u5b57,*,NUM,_": 56,
|
206 |
+
"p,\u52a9\u8a5e,\u53e5\u672b,*,PART,_": 57,
|
207 |
+
"p,\u52a9\u8a5e,\u53e5\u982d,*,PART,_": 58,
|
208 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4e26\u5217,CCONJ,_": 59,
|
209 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u4f53\u8a00\u5316,PART,_": 60,
|
210 |
+
"p,\u52a9\u8a5e,\u63a5\u7d9a,\u5c5e\u683c,SCONJ,_": 61,
|
211 |
+
"p,\u52a9\u8a5e,\u63d0\u793a,*,PART,_": 62,
|
212 |
+
"p,\u611f\u5606\u8a5e,*,*,INTJ,_": 63,
|
213 |
+
"p,\u63a5\u5c3e\u8f9e,*,*,PART,_": 64,
|
214 |
+
"s,\u6587\u5b57,*,*,SYM,_": 65,
|
215 |
+
"s,\u8a18\u53f7,\u4e00\u822c,*,SYM,_": 66,
|
216 |
+
"s,\u8a18\u53f7,\u53e5\u70b9,*,PUNCT,_": 67,
|
217 |
+
"s,\u8a18\u53f7,\u8aad\u70b9,*,PUNCT,_": 68,
|
218 |
+
"v,\u524d\u7f6e\u8a5e,\u57fa\u76e4,*,ADP,_": 69,
|
219 |
+
"v,\u524d\u7f6e\u8a5e,\u6e90\u6cc9,*,ADP,_": 70,
|
220 |
+
"v,\u524d\u7f6e\u8a5e,\u7d4c\u7531,*,ADP,_": 71,
|
221 |
+
"v,\u524d\u7f6e\u8a5e,\u95a2\u4fc2,*,ADP,_": 72,
|
222 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u63a8\u5b9a,ADV,_": 73,
|
223 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u78ba\u5b9a,ADV,_": 74,
|
224 |
+
"v,\u526f\u8a5e,\u5224\u65ad,\u9006\u63a5,ADV,_": 75,
|
225 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u4f53\u8a00\u5426\u5b9a,ADV,Polarity=Neg": 76,
|
226 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u6709\u754c,ADV,Polarity=Neg": 77,
|
227 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7121\u754c,ADV,Polarity=Neg": 78,
|
228 |
+
"v,\u526f\u8a5e,\u5426\u5b9a,\u7981\u6b62,ADV,Polarity=Neg": 79,
|
229 |
+
"v,\u526f\u8a5e,\u63cf\u5199,*,ADV,_": 80,
|
230 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5909\u5316,ADV,AdvType=Tim": 81,
|
231 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5b8c\u4e86,ADV,AdvType=Tim|Aspect=Perf": 82,
|
232 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u5c06\u6765,ADV,AdvType=Tim|Tense=Fut": 83,
|
233 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u6052\u5e38,ADV,AdvType=Tim": 84,
|
234 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u73fe\u5728,ADV,AdvType=Tim|Tense=Pres": 85,
|
235 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d42\u5c40,ADV,AdvType=Tim": 86,
|
236 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7d99\u8d77,ADV,AdvType=Tim": 87,
|
237 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u7dca\u63a5,ADV,AdvType=Tim": 88,
|
238 |
+
"v,\u526f\u8a5e,\u6642\u76f8,\u904e\u53bb,ADV,AdvType=Tim|Tense=Past": 89,
|
239 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u539f\u56e0,ADV,AdvType=Cau": 90,
|
240 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u53cd\u8a9e,ADV,_": 91,
|
241 |
+
"v,\u526f\u8a5e,\u7591\u554f,\u6240\u5728,ADV,_": 92,
|
242 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u3084\u3084\u9ad8\u5ea6,ADV,AdvType=Deg|Degree=Cmp": 93,
|
243 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u6975\u5ea6,ADV,AdvType=Deg|Degree=Sup": 94,
|
244 |
+
"v,\u526f\u8a5e,\u7a0b\u5ea6,\u8efd\u5ea6,ADV,AdvType=Deg|Degree=Pos": 95,
|
245 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u5171\u540c,ADV,_": 96,
|
246 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u7dcf\u62ec,ADV,_": 97,
|
247 |
+
"v,\u526f\u8a5e,\u7bc4\u56f2,\u9650\u5b9a,ADV,_": 98,
|
248 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u5076\u767a,ADV,_": 99,
|
249 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u91cd\u8907,ADV,_": 100,
|
250 |
+
"v,\u526f\u8a5e,\u983b\u5ea6,\u983b\u7e41,ADV,_": 101,
|
251 |
+
"v,\u52a9\u52d5\u8a5e,\u53d7\u52d5,*,AUX,Voice=Pass": 102,
|
252 |
+
"v,\u52a9\u52d5\u8a5e,\u53ef\u80fd,*,AUX,Mood=Pot": 103,
|
253 |
+
"v,\u52a9\u52d5\u8a5e,\u5fc5\u8981,*,AUX,Mood=Nec": 104,
|
254 |
+
"v,\u52a9\u52d5\u8a5e,\u9858\u671b,*,AUX,Mood=Des": 105,
|
255 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u5236\u5ea6,VERB,_": 106,
|
256 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u6027\u8cea,VERB,_": 107,
|
257 |
+
"v,\u52d5\u8a5e,\u5909\u5316,\u751f\u7269,VERB,_": 108,
|
258 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,Polarity=Neg": 109,
|
259 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,VerbType=Cop": 110,
|
260 |
+
"v,\u52d5\u8a5e,\u5b58\u5728,\u5b58\u5728,VERB,_": 111,
|
261 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5883\u9047,VERB,Degree=Pos": 112,
|
262 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u5f62\u8cea,VERB,Degree=Pos": 113,
|
263 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u614b\u5ea6,VERB,Degree=Pos": 114,
|
264 |
+
"v,\u52d5\u8a5e,\u63cf\u5199,\u91cf,VERB,Degree=Pos": 115,
|
265 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4ea4\u6d41,VERB,_": 116,
|
266 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f1d\u9054,VERB,_": 117,
|
267 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u4f7f\u5f79,VERB,_": 118,
|
268 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5100\u793c,VERB,_": 119,
|
269 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5206\u985e,VERB,Degree=Equ": 120,
|
270 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u52d5\u4f5c,VERB,_": 121,
|
271 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u59ff\u52e2,VERB,_": 122,
|
272 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f79\u5272,VERB,_": 123,
|
273 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u5f97\u5931,VERB,_": 124,
|
274 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u614b\u5ea6,VERB,_": 125,
|
275 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u751f\u7523,VERB,_": 126,
|
276 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u79fb\u52d5,VERB,_": 127,
|
277 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u8a2d\u7f6e,VERB,_": 128,
|
278 |
+
"v,\u52d5\u8a5e,\u884c\u70ba,\u98f2\u98df,VERB,_": 129
|
279 |
},
|
280 |
"layer_norm_eps": 1e-05,
|
281 |
"max_position_embeddings": 514,
|
|
|
286 |
"position_embedding_type": "absolute",
|
287 |
"tokenizer_class": "BertTokenizer",
|
288 |
"torch_dtype": "float32",
|
289 |
+
"transformers_version": "4.11.3",
|
290 |
"type_vocab_size": 1,
|
291 |
"use_cache": true,
|
292 |
"vocab_size": 26318
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:569d41c0e1f35f10d9afaac21fc1196fa38bedb85b9a94382fd02995e57ec835
|
3 |
+
size 423142673
|
suparkanbun/models/labelPOS.txt
CHANGED
@@ -6,7 +6,6 @@ n,代名詞,人称,他,PRON,PronType=Prs|Reflex=Yes
|
|
6 |
n,代名詞,人称,止格,PRON,Person=1|PronType=Prs
|
7 |
n,代名詞,人称,止格,PRON,Person=2|PronType=Prs
|
8 |
n,代名詞,人称,止格,PRON,Person=3|PronType=Prs
|
9 |
-
n,代名詞,人称,止格,PRON,PronType=Prs
|
10 |
n,代名詞,人称,起格,PRON,Person=1|PronType=Prs
|
11 |
n,代名詞,人称,起格,PRON,Person=2|PronType=Prs
|
12 |
n,代名詞,人称,起格,PRON,Person=3|PronType=Prs
|
@@ -20,6 +19,7 @@ n,名詞,主体,動物,NOUN,_
|
|
20 |
n,名詞,主体,国名,PROPN,Case=Loc|NameType=Nat
|
21 |
n,名詞,主体,書物,NOUN,_
|
22 |
n,名詞,主体,機関,NOUN,_
|
|
|
23 |
n,名詞,主体,集団,NOUN,_
|
24 |
n,名詞,人,その他の人名,PROPN,NameType=Prs
|
25 |
n,名詞,人,人,NOUN,_
|
@@ -45,7 +45,8 @@ n,名詞,天象,天文,NOUN,_
|
|
45 |
n,名詞,天象,怪異,NOUN,_
|
46 |
n,名詞,天象,気象,NOUN,_
|
47 |
n,名詞,度量衡,*,NOUN,NounType=Clf
|
48 |
-
n
|
|
|
49 |
n,名詞,描写,形質,NOUN,_
|
50 |
n,名詞,描写,態度,NOUN,_
|
51 |
n,名詞,数量,*,NOUN,_
|
|
|
6 |
n,代名詞,人称,止格,PRON,Person=1|PronType=Prs
|
7 |
n,代名詞,人称,止格,PRON,Person=2|PronType=Prs
|
8 |
n,代名詞,人称,止格,PRON,Person=3|PronType=Prs
|
|
|
9 |
n,代名詞,人称,起格,PRON,Person=1|PronType=Prs
|
10 |
n,代名詞,人称,起格,PRON,Person=2|PronType=Prs
|
11 |
n,代名詞,人称,起格,PRON,Person=3|PronType=Prs
|
|
|
19 |
n,名詞,主体,国名,PROPN,Case=Loc|NameType=Nat
|
20 |
n,名詞,主体,書物,NOUN,_
|
21 |
n,名詞,主体,機関,NOUN,_
|
22 |
+
n,名詞,主体,神仏,NOUN,_
|
23 |
n,名詞,主体,集団,NOUN,_
|
24 |
n,名詞,人,その他の人名,PROPN,NameType=Prs
|
25 |
n,名詞,人,人,NOUN,_
|
|
|
45 |
n,名詞,天象,怪異,NOUN,_
|
46 |
n,名詞,天象,気象,NOUN,_
|
47 |
n,名詞,度量衡,*,NOUN,NounType=Clf
|
48 |
+
n,名詞,思考,思考,NOUN,_
|
49 |
+
n,名詞,思考,方略,NOUN,_
|
50 |
n,名詞,描写,形質,NOUN,_
|
51 |
n,名詞,描写,態度,NOUN,_
|
52 |
n,名詞,数量,*,NOUN,_
|
suparkanbun/models/lzh_kyoto.conllu
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42280a7cd407b29197200fa5e32deb8a33fb86a543dbfed5460443d3a4493249
|
3 |
+
size 27358204
|
tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "special_tokens_map_file": null, "model_max_length": 512, "do_basic_tokenize": true, "never_split": null, "add_prefix_space": true, "name_or_path": "KoichiYasuoka/roberta-classical-chinese-base-char", "tokenizer_class": "BertTokenizer"}
|