KoichiYasuoka committed on
Commit
25a640c
·
1 Parent(s): 2709dc3

model improved

Browse files
Files changed (3) hide show
  1. config.json +297 -287
  2. pytorch_model.bin +2 -2
  3. supar.model +2 -2
config.json CHANGED
@@ -34,147 +34,149 @@
34
  "22": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
35
  "23": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
36
  "24": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_",
37
- "25": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
38
- "26": "B-NOUN|\u540d\u8a5e|_",
39
- "27": "B-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
40
- "28": "B-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_",
41
- "29": "B-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
42
- "30": "B-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
43
- "31": "B-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
44
- "32": "B-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
45
- "33": "B-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
46
- "34": "B-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
47
- "35": "B-NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
48
- "36": "B-NUM|\u6570\u8a5e|_",
49
- "37": "B-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_",
50
- "38": "B-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
51
- "39": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_",
52
- "40": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
53
- "41": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
54
- "42": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
55
- "43": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
56
- "44": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_",
57
- "45": "B-PART|\u63a5\u5c3e\u8f9e|_",
58
- "46": "B-PART|\u63a5\u982d\u8f9e|_",
59
- "47": "B-PART|\u7d42\u52a9\u8a5e|_",
60
- "48": "B-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
61
- "49": "B-PRON|\u4ee3\u540d\u8a5e|_",
62
- "50": "B-PROPN|\u56fa\u6709\u540d\u8a5e|_",
63
- "51": "B-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
64
- "52": "B-PUNCT|\u8a18\u53f7|_",
65
- "53": "B-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
66
- "54": "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
67
- "55": "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_",
68
- "56": "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_",
69
- "57": "B-SCONJ|\u63a5\u7d9a\u8a5e|_",
70
- "58": "B-SYM|_|_",
71
- "59": "B-VERB|\u4ed6\u52d5\u8a5e|_",
72
- "60": "B-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
73
- "61": "B-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
74
- "62": "B-VERB|\u5b8c\u5168\u52d5\u8a5e|_",
75
- "63": "B-VERB|\u81ea\u52d5\u8a5e|_",
76
- "64": "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
77
- "65": "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
78
- "66": "B-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
79
- "67": "B-X|_|_",
80
- "68": "CCONJ|\u63a5\u7d9a\u8a5e|_",
81
- "69": "DET|\u9023\u4f53\u8a5e|_",
82
- "70": "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_",
83
- "71": "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_",
84
- "72": "I-ADP|\u526f\u52a9\u8a5e|_",
85
- "73": "I-ADP|\u683c\u52a9\u8a5e|_",
86
- "74": "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_",
87
- "75": "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
88
- "76": "I-ADV|\u526f\u8a5e|_",
89
- "77": "I-ADV|\u526f\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
90
- "78": "I-ADV|\u526f\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
91
- "79": "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
92
- "80": "I-AUX|\u52a9\u52d5\u8a5e|_",
93
- "81": "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
94
- "82": "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
95
- "83": "I-CCONJ|\u63a5\u7d9a\u8a5e|_",
96
- "84": "I-DET|\u9023\u4f53\u8a5e|_",
97
- "85": "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
98
- "86": "I-INTJ|\u9593\u6295\u8a5e|_",
99
- "87": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
100
- "88": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
101
- "89": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_",
102
- "90": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
103
- "91": "I-NOUN|\u540d\u8a5e|_",
104
- "92": "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
105
- "93": "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_",
106
- "94": "I-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
107
- "95": "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
108
- "96": "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
109
- "97": "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
110
- "98": "I-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
111
- "99": "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
112
- "100": "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
113
- "101": "I-NUM|\u6570\u8a5e|_",
114
- "102": "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_",
115
- "103": "I-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
116
- "104": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_",
117
- "105": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
118
- "106": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
119
- "107": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
120
- "108": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
121
- "109": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_",
122
- "110": "I-PART|\u63a5\u5c3e\u8f9e|_",
123
- "111": "I-PART|\u63a5\u982d\u8f9e|_",
124
- "112": "I-PART|\u7d42\u52a9\u8a5e|_",
125
- "113": "I-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
126
- "114": "I-PRON|\u4ee3\u540d\u8a5e|_",
127
- "115": "I-PROPN|\u56fa\u6709\u540d\u8a5e|_",
128
- "116": "I-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
129
- "117": "I-PUNCT|\u8a18\u53f7|_",
130
- "118": "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
131
- "119": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
132
- "120": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_",
133
- "121": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_",
134
- "122": "I-SCONJ|\u63a5\u7d9a\u8a5e|_",
135
- "123": "I-SYM|_|_",
136
- "124": "I-VERB|\u4ed6\u52d5\u8a5e|_",
137
- "125": "I-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
138
- "126": "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
139
- "127": "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_",
140
- "128": "I-VERB|\u81ea\u52d5\u8a5e|_",
141
- "129": "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
142
- "130": "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
143
- "131": "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
144
- "132": "I-X|_|_",
145
- "133": "INTJ|\u9593\u6295\u8a5e|_",
146
- "134": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
147
- "135": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
148
- "136": "NOUN|\u540d\u8a5e|_",
149
- "137": "NOUN|\u540d\u8a5e|_+ADP|\u526f\u52a9\u8a5e|_",
150
- "138": "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
151
- "139": "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
152
- "140": "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
153
- "141": "NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
154
- "142": "NUM|\u6570\u8a5e|_",
155
- "143": "PART|\u4eba\u79f0\u63a5\u8f9e|_",
156
- "144": "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
157
- "145": "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
158
- "146": "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
159
- "147": "PART|\u63a5\u5c3e\u8f9e|_",
160
- "148": "PART|\u63a5\u982d\u8f9e|_",
161
- "149": "PART|\u7d42\u52a9\u8a5e|_",
162
- "150": "PROPN|\u56fa\u6709\u540d\u8a5e|_",
163
- "151": "PUNCT|\u8a18\u53f7|_",
164
- "152": "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
165
- "153": "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
166
- "154": "SCONJ|\u63a5\u7d9a\u8a5e|_",
167
- "155": "SYM",
168
- "156": "SYM|_|_",
169
- "157": "VERB|\u4ed6\u52d5\u8a5e|_",
170
- "158": "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
171
- "159": "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_",
172
- "160": "VERB|\u5b8c\u5168\u52d5\u8a5e|_",
173
- "161": "VERB|\u81ea\u52d5\u8a5e|_",
174
- "162": "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_",
175
- "163": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
176
- "164": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
177
- "165": "VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_"
 
 
178
  },
179
  "initializer_range": 0.02,
180
  "intermediate_size": 3072,
@@ -204,147 +206,149 @@
204
  "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 22,
205
  "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 23,
206
  "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_": 24,
207
- "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 25,
208
- "B-NOUN|\u540d\u8a5e|_": 26,
209
- "B-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 27,
210
- "B-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_": 28,
211
- "B-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 29,
212
- "B-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 30,
213
- "B-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 31,
214
- "B-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 32,
215
- "B-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 33,
216
- "B-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 34,
217
- "B-NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 35,
218
- "B-NUM|\u6570\u8a5e|_": 36,
219
- "B-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_": 37,
220
- "B-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 38,
221
- "B-PART|\u4eba\u79f0\u63a5\u8f9e|_": 39,
222
- "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 40,
223
- "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 41,
224
- "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 42,
225
- "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 43,
226
- "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_": 44,
227
- "B-PART|\u63a5\u5c3e\u8f9e|_": 45,
228
- "B-PART|\u63a5\u982d\u8f9e|_": 46,
229
- "B-PART|\u7d42\u52a9\u8a5e|_": 47,
230
- "B-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 48,
231
- "B-PRON|\u4ee3\u540d\u8a5e|_": 49,
232
- "B-PROPN|\u56fa\u6709\u540d\u8a5e|_": 50,
233
- "B-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 51,
234
- "B-PUNCT|\u8a18\u53f7|_": 52,
235
- "B-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 53,
236
- "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 54,
237
- "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_": 55,
238
- "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_": 56,
239
- "B-SCONJ|\u63a5\u7d9a\u8a5e|_": 57,
240
- "B-SYM|_|_": 58,
241
- "B-VERB|\u4ed6\u52d5\u8a5e|_": 59,
242
- "B-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 60,
243
- "B-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 61,
244
- "B-VERB|\u5b8c\u5168\u52d5\u8a5e|_": 62,
245
- "B-VERB|\u81ea\u52d5\u8a5e|_": 63,
246
- "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 64,
247
- "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 65,
248
- "B-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 66,
249
- "B-X|_|_": 67,
250
- "CCONJ|\u63a5\u7d9a\u8a5e|_": 68,
251
- "DET|\u9023\u4f53\u8a5e|_": 69,
252
- "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_": 70,
253
- "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 71,
254
- "I-ADP|\u526f\u52a9\u8a5e|_": 72,
255
- "I-ADP|\u683c\u52a9\u8a5e|_": 73,
256
- "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 74,
257
- "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 75,
258
- "I-ADV|\u526f\u8a5e|_": 76,
259
- "I-ADV|\u526f\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 77,
260
- "I-ADV|\u526f\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 78,
261
- "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 79,
262
- "I-AUX|\u52a9\u52d5\u8a5e|_": 80,
263
- "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 81,
264
- "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 82,
265
- "I-CCONJ|\u63a5\u7d9a\u8a5e|_": 83,
266
- "I-DET|\u9023\u4f53\u8a5e|_": 84,
267
- "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 85,
268
- "I-INTJ|\u9593\u6295\u8a5e|_": 86,
269
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 87,
270
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 88,
271
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_": 89,
272
- "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 90,
273
- "I-NOUN|\u540d\u8a5e|_": 91,
274
- "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 92,
275
- "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_": 93,
276
- "I-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 94,
277
- "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 95,
278
- "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 96,
279
- "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 97,
280
- "I-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 98,
281
- "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 99,
282
- "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 100,
283
- "I-NUM|\u6570\u8a5e|_": 101,
284
- "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_": 102,
285
- "I-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 103,
286
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_": 104,
287
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 105,
288
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 106,
289
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 107,
290
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 108,
291
- "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_": 109,
292
- "I-PART|\u63a5\u5c3e\u8f9e|_": 110,
293
- "I-PART|\u63a5\u982d\u8f9e|_": 111,
294
- "I-PART|\u7d42\u52a9\u8a5e|_": 112,
295
- "I-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 113,
296
- "I-PRON|\u4ee3\u540d\u8a5e|_": 114,
297
- "I-PROPN|\u56fa\u6709\u540d\u8a5e|_": 115,
298
- "I-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 116,
299
- "I-PUNCT|\u8a18\u53f7|_": 117,
300
- "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 118,
301
- "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 119,
302
- "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_": 120,
303
- "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_": 121,
304
- "I-SCONJ|\u63a5\u7d9a\u8a5e|_": 122,
305
- "I-SYM|_|_": 123,
306
- "I-VERB|\u4ed6\u52d5\u8a5e|_": 124,
307
- "I-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 125,
308
- "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 126,
309
- "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_": 127,
310
- "I-VERB|\u81ea\u52d5\u8a5e|_": 128,
311
- "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 129,
312
- "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 130,
313
- "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 131,
314
- "I-X|_|_": 132,
315
- "INTJ|\u9593\u6295\u8a5e|_": 133,
316
- "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 134,
317
- "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 135,
318
- "NOUN|\u540d\u8a5e|_": 136,
319
- "NOUN|\u540d\u8a5e|_+ADP|\u526f\u52a9\u8a5e|_": 137,
320
- "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 138,
321
- "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 139,
322
- "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 140,
323
- "NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 141,
324
- "NUM|\u6570\u8a5e|_": 142,
325
- "PART|\u4eba\u79f0\u63a5\u8f9e|_": 143,
326
- "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 144,
327
- "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 145,
328
- "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 146,
329
- "PART|\u63a5\u5c3e\u8f9e|_": 147,
330
- "PART|\u63a5\u982d\u8f9e|_": 148,
331
- "PART|\u7d42\u52a9\u8a5e|_": 149,
332
- "PROPN|\u56fa\u6709\u540d\u8a5e|_": 150,
333
- "PUNCT|\u8a18\u53f7|_": 151,
334
- "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 152,
335
- "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 153,
336
- "SCONJ|\u63a5\u7d9a\u8a5e|_": 154,
337
- "SYM": 155,
338
- "SYM|_|_": 156,
339
- "VERB|\u4ed6\u52d5\u8a5e|_": 157,
340
- "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 158,
341
- "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_": 159,
342
- "VERB|\u5b8c\u5168\u52d5\u8a5e|_": 160,
343
- "VERB|\u81ea\u52d5\u8a5e|_": 161,
344
- "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_": 162,
345
- "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 163,
346
- "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 164,
347
- "VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 165
 
 
348
  },
349
  "layer_norm_eps": 1e-07,
350
  "max_position_embeddings": 512,
@@ -409,10 +413,6 @@
409
  "nangonna": [
410
  "nangon",
411
  "na"
412
- ],
413
- "\u30ca\u30f3\u30b3\u30f3\u30ca": [
414
- "\u30ca\u30f3\u30b3\u31ff",
415
- "\u30ca"
416
  ]
417
  },
418
  "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_": {
@@ -543,6 +543,12 @@
543
  "purai"
544
  ]
545
  },
 
 
 
 
 
 
546
  "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": {
547
  "Omakun": [
548
  "Omak",
@@ -784,6 +790,10 @@
784
  "chi",
785
  "kik"
786
  ],
 
 
 
 
787
  "chitomtekarkar": [
788
  "chi",
789
  "tomtekarkar"
@@ -939,7 +949,7 @@
939
  },
940
  "tokenizer_class": "DebertaV2TokenizerFast",
941
  "torch_dtype": "float32",
942
- "transformers_version": "4.26.1",
943
  "type_vocab_size": 0,
944
  "vocab_size": 6877
945
  }
 
34
  "22": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
35
  "23": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
36
  "24": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_",
37
+ "25": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
38
+ "26": "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
39
+ "27": "B-NOUN|\u540d\u8a5e|_",
40
+ "28": "B-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
41
+ "29": "B-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_",
42
+ "30": "B-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
43
+ "31": "B-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
44
+ "32": "B-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
45
+ "33": "B-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
46
+ "34": "B-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
47
+ "35": "B-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
48
+ "36": "B-NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
49
+ "37": "B-NUM|\u6570\u8a5e|_",
50
+ "38": "B-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_",
51
+ "39": "B-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
52
+ "40": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_",
53
+ "41": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
54
+ "42": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
55
+ "43": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
56
+ "44": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
57
+ "45": "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_",
58
+ "46": "B-PART|\u63a5\u5c3e\u8f9e|_",
59
+ "47": "B-PART|\u63a5\u982d\u8f9e|_",
60
+ "48": "B-PART|\u7d42\u52a9\u8a5e|_",
61
+ "49": "B-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
62
+ "50": "B-PRON|\u4ee3\u540d\u8a5e|_",
63
+ "51": "B-PROPN|\u56fa\u6709\u540d\u8a5e|_",
64
+ "52": "B-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
65
+ "53": "B-PUNCT|\u8a18\u53f7|_",
66
+ "54": "B-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
67
+ "55": "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
68
+ "56": "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_",
69
+ "57": "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_",
70
+ "58": "B-SCONJ|\u63a5\u7d9a\u8a5e|_",
71
+ "59": "B-SYM|_|_",
72
+ "60": "B-VERB|\u4ed6\u52d5\u8a5e|_",
73
+ "61": "B-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
74
+ "62": "B-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
75
+ "63": "B-VERB|\u5b8c\u5168\u52d5\u8a5e|_",
76
+ "64": "B-VERB|\u81ea\u52d5\u8a5e|_",
77
+ "65": "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
78
+ "66": "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
79
+ "67": "B-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
80
+ "68": "B-X|_|_",
81
+ "69": "CCONJ|\u63a5\u7d9a\u8a5e|_",
82
+ "70": "DET|\u9023\u4f53\u8a5e|_",
83
+ "71": "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_",
84
+ "72": "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_",
85
+ "73": "I-ADP|\u526f\u52a9\u8a5e|_",
86
+ "74": "I-ADP|\u683c\u52a9\u8a5e|_",
87
+ "75": "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_",
88
+ "76": "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
89
+ "77": "I-ADV|\u526f\u8a5e|_",
90
+ "78": "I-ADV|\u526f\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
91
+ "79": "I-ADV|\u526f\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
92
+ "80": "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
93
+ "81": "I-AUX|\u52a9\u52d5\u8a5e|_",
94
+ "82": "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
95
+ "83": "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
96
+ "84": "I-CCONJ|\u63a5\u7d9a\u8a5e|_",
97
+ "85": "I-DET|\u9023\u4f53\u8a5e|_",
98
+ "86": "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
99
+ "87": "I-INTJ|\u9593\u6295\u8a5e|_",
100
+ "88": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
101
+ "89": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
102
+ "90": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_",
103
+ "91": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
104
+ "92": "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
105
+ "93": "I-NOUN|\u540d\u8a5e|_",
106
+ "94": "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
107
+ "95": "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_",
108
+ "96": "I-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
109
+ "97": "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
110
+ "98": "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_",
111
+ "99": "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
112
+ "100": "I-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
113
+ "101": "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
114
+ "102": "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
115
+ "103": "I-NUM|\u6570\u8a5e|_",
116
+ "104": "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_",
117
+ "105": "I-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
118
+ "106": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_",
119
+ "107": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_",
120
+ "108": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
121
+ "109": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
122
+ "110": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
123
+ "111": "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_",
124
+ "112": "I-PART|\u63a5\u5c3e\u8f9e|_",
125
+ "113": "I-PART|\u63a5\u982d\u8f9e|_",
126
+ "114": "I-PART|\u7d42\u52a9\u8a5e|_",
127
+ "115": "I-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
128
+ "116": "I-PRON|\u4ee3\u540d\u8a5e|_",
129
+ "117": "I-PROPN|\u56fa\u6709\u540d\u8a5e|_",
130
+ "118": "I-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
131
+ "119": "I-PUNCT|\u8a18\u53f7|_",
132
+ "120": "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
133
+ "121": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
134
+ "122": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_",
135
+ "123": "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_",
136
+ "124": "I-SCONJ|\u63a5\u7d9a\u8a5e|_",
137
+ "125": "I-SYM|_|_",
138
+ "126": "I-VERB|\u4ed6\u52d5\u8a5e|_",
139
+ "127": "I-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
140
+ "128": "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
141
+ "129": "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_",
142
+ "130": "I-VERB|\u81ea\u52d5\u8a5e|_",
143
+ "131": "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_",
144
+ "132": "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_",
145
+ "133": "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
146
+ "134": "I-X|_|_",
147
+ "135": "INTJ|\u9593\u6295\u8a5e|_",
148
+ "136": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
149
+ "137": "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
150
+ "138": "NOUN|\u540d\u8a5e|_",
151
+ "139": "NOUN|\u540d\u8a5e|_+ADP|\u526f\u52a9\u8a5e|_",
152
+ "140": "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_",
153
+ "141": "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_",
154
+ "142": "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_",
155
+ "143": "NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
156
+ "144": "NUM|\u6570\u8a5e|_",
157
+ "145": "PART|\u4eba\u79f0\u63a5\u8f9e|_",
158
+ "146": "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
159
+ "147": "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
160
+ "148": "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_",
161
+ "149": "PART|\u63a5\u5c3e\u8f9e|_",
162
+ "150": "PART|\u63a5\u982d\u8f9e|_",
163
+ "151": "PART|\u7d42\u52a9\u8a5e|_",
164
+ "152": "PROPN|\u56fa\u6709\u540d\u8a5e|_",
165
+ "153": "PUNCT|\u8a18\u53f7|_",
166
+ "154": "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_",
167
+ "155": "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_",
168
+ "156": "SCONJ|\u63a5\u7d9a\u8a5e|_",
169
+ "157": "SYM",
170
+ "158": "SYM|_|_",
171
+ "159": "VERB|\u4ed6\u52d5\u8a5e|_",
172
+ "160": "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
173
+ "161": "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_",
174
+ "162": "VERB|\u5b8c\u5168\u52d5\u8a5e|_",
175
+ "163": "VERB|\u81ea\u52d5\u8a5e|_",
176
+ "164": "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_",
177
+ "165": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_",
178
+ "166": "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_",
179
+ "167": "VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_"
180
  },
181
  "initializer_range": 0.02,
182
  "intermediate_size": 3072,
 
206
  "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 22,
207
  "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 23,
208
  "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_": 24,
209
+ "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 25,
210
+ "B-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 26,
211
+ "B-NOUN|\u540d\u8a5e|_": 27,
212
+ "B-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 28,
213
+ "B-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_": 29,
214
+ "B-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 30,
215
+ "B-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 31,
216
+ "B-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 32,
217
+ "B-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 33,
218
+ "B-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 34,
219
+ "B-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 35,
220
+ "B-NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 36,
221
+ "B-NUM|\u6570\u8a5e|_": 37,
222
+ "B-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_": 38,
223
+ "B-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 39,
224
+ "B-PART|\u4eba\u79f0\u63a5\u8f9e|_": 40,
225
+ "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 41,
226
+ "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 42,
227
+ "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 43,
228
+ "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 44,
229
+ "B-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_": 45,
230
+ "B-PART|\u63a5\u5c3e\u8f9e|_": 46,
231
+ "B-PART|\u63a5\u982d\u8f9e|_": 47,
232
+ "B-PART|\u7d42\u52a9\u8a5e|_": 48,
233
+ "B-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 49,
234
+ "B-PRON|\u4ee3\u540d\u8a5e|_": 50,
235
+ "B-PROPN|\u56fa\u6709\u540d\u8a5e|_": 51,
236
+ "B-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 52,
237
+ "B-PUNCT|\u8a18\u53f7|_": 53,
238
+ "B-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 54,
239
+ "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 55,
240
+ "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_": 56,
241
+ "B-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_": 57,
242
+ "B-SCONJ|\u63a5\u7d9a\u8a5e|_": 58,
243
+ "B-SYM|_|_": 59,
244
+ "B-VERB|\u4ed6\u52d5\u8a5e|_": 60,
245
+ "B-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 61,
246
+ "B-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 62,
247
+ "B-VERB|\u5b8c\u5168\u52d5\u8a5e|_": 63,
248
+ "B-VERB|\u81ea\u52d5\u8a5e|_": 64,
249
+ "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 65,
250
+ "B-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 66,
251
+ "B-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 67,
252
+ "B-X|_|_": 68,
253
+ "CCONJ|\u63a5\u7d9a\u8a5e|_": 69,
254
+ "DET|\u9023\u4f53\u8a5e|_": 70,
255
+ "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_": 71,
256
+ "DET|\u9023\u4f53\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 72,
257
+ "I-ADP|\u526f\u52a9\u8a5e|_": 73,
258
+ "I-ADP|\u683c\u52a9\u8a5e|_": 74,
259
+ "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_": 75,
260
+ "I-ADP|\u683c\u52a9\u8a5e|_+VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 76,
261
+ "I-ADV|\u526f\u8a5e|_": 77,
262
+ "I-ADV|\u526f\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 78,
263
+ "I-ADV|\u526f\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 79,
264
+ "I-AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 80,
265
+ "I-AUX|\u52a9\u52d5\u8a5e|_": 81,
266
+ "I-AUX|\u52a9\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 82,
267
+ "I-AUX|\u52a9\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 83,
268
+ "I-CCONJ|\u63a5\u7d9a\u8a5e|_": 84,
269
+ "I-DET|\u9023\u4f53\u8a5e|_": 85,
270
+ "I-DET|\u9023\u4f53\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 86,
271
+ "I-INTJ|\u9593\u6295\u8a5e|_": 87,
272
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 88,
273
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 89,
274
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_+NOUN|\u540d\u8a5e|_": 90,
275
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 91,
276
+ "I-NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 92,
277
+ "I-NOUN|\u540d\u8a5e|_": 93,
278
+ "I-NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 94,
279
+ "I-NOUN|\u540d\u8a5e|_+ADV|\u526f\u8a5e|_": 95,
280
+ "I-NOUN|\u540d\u8a5e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 96,
281
+ "I-NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 97,
282
+ "I-NOUN|\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": 98,
283
+ "I-NOUN|\u540d\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 99,
284
+ "I-NOUN|\u540d\u8a5e|_+SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 100,
285
+ "I-NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 101,
286
+ "I-NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 102,
287
+ "I-NUM|\u6570\u8a5e|_": 103,
288
+ "I-NUM|\u6570\u8a5e|_+NOUN|\u540d\u8a5e|_": 104,
289
+ "I-NUM|\u6570\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 105,
290
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_": 106,
291
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+AUX|\u30c7\u30a2\u30eb\u52d5\u8a5e|_": 107,
292
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 108,
293
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 109,
294
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 110,
295
+ "I-PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u81ea\u52d5\u8a5e|_": 111,
296
+ "I-PART|\u63a5\u5c3e\u8f9e|_": 112,
297
+ "I-PART|\u63a5\u982d\u8f9e|_": 113,
298
+ "I-PART|\u7d42\u52a9\u8a5e|_": 114,
299
+ "I-PART|\u7d42\u52a9\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 115,
300
+ "I-PRON|\u4ee3\u540d\u8a5e|_": 116,
301
+ "I-PROPN|\u56fa\u6709\u540d\u8a5e|_": 117,
302
+ "I-PROPN|\u56fa\u6709\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 118,
303
+ "I-PUNCT|\u8a18\u53f7|_": 119,
304
+ "I-SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 120,
305
+ "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 121,
306
+ "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+ADV|\u526f\u8a5e|_": 122,
307
+ "I-SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_+DET|\u9023\u4f53\u8a5e|_": 123,
308
+ "I-SCONJ|\u63a5\u7d9a\u8a5e|_": 124,
309
+ "I-SYM|_|_": 125,
310
+ "I-VERB|\u4ed6\u52d5\u8a5e|_": 126,
311
+ "I-VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 127,
312
+ "I-VERB|\u4ed6\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 128,
313
+ "I-VERB|\u5b8c\u5168\u52d5\u8a5e|_": 129,
314
+ "I-VERB|\u81ea\u52d5\u8a5e|_": 130,
315
+ "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u4eba\u79f0\u63a5\u8f9e|_": 131,
316
+ "I-VERB|\u81ea\u52d5\u8a5e|_+PART|\u7d42\u52a9\u8a5e|_": 132,
317
+ "I-VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 133,
318
+ "I-X|_|_": 134,
319
+ "INTJ|\u9593\u6295\u8a5e|_": 135,
320
+ "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 136,
321
+ "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 137,
322
+ "NOUN|\u540d\u8a5e|_": 138,
323
+ "NOUN|\u540d\u8a5e|_+ADP|\u526f\u52a9\u8a5e|_": 139,
324
+ "NOUN|\u540d\u8a5e|_+ADP|\u683c\u52a9\u8a5e|_": 140,
325
+ "NOUN|\u540d\u8a5e|_+NOUN|\u4f4d\u7f6e\u540d\u8a5e|_": 141,
326
+ "NOUN|\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": 142,
327
+ "NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 143,
328
+ "NUM|\u6570\u8a5e|_": 144,
329
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_": 145,
330
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 146,
331
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 147,
332
+ "PART|\u4eba\u79f0\u63a5\u8f9e|_+VERB|\u4ed6\u52d5\u8a5e|_": 148,
333
+ "PART|\u63a5\u5c3e\u8f9e|_": 149,
334
+ "PART|\u63a5\u982d\u8f9e|_": 150,
335
+ "PART|\u7d42\u52a9\u8a5e|_": 151,
336
+ "PROPN|\u56fa\u6709\u540d\u8a5e|_": 152,
337
+ "PUNCT|\u8a18\u53f7|_": 153,
338
+ "SCONJ|\u5f8c\u7f6e\u526f\u8a5e|_": 154,
339
+ "SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 155,
340
+ "SCONJ|\u63a5\u7d9a\u8a5e|_": 156,
341
+ "SYM": 157,
342
+ "SYM|_|_": 158,
343
+ "VERB|\u4ed6\u52d5\u8a5e|_": 159,
344
+ "VERB|\u4ed6\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 160,
345
+ "VERB|\u4ed6\u52d5\u8a5e|_+PART|\u63a5\u5c3e\u8f9e|_": 161,
346
+ "VERB|\u5b8c\u5168\u52d5\u8a5e|_": 162,
347
+ "VERB|\u81ea\u52d5\u8a5e|_": 163,
348
+ "VERB|\u81ea\u52d5\u8a5e|_+AUX|\u52a9\u52d5\u8a5e|_": 164,
349
+ "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u540d\u8a5e|_": 165,
350
+ "VERB|\u81ea\u52d5\u8a5e|_+NOUN|\u5f62\u5f0f\u540d\u8a5e|_": 166,
351
+ "VERB|\u81ea\u52d5\u8a5e|_+SCONJ|\u63a5\u7d9a\u52a9\u8a5e|_": 167
352
  },
353
  "layer_norm_eps": 1e-07,
354
  "max_position_embeddings": 512,
 
413
  "nangonna": [
414
  "nangon",
415
  "na"
 
 
 
 
416
  ]
417
  },
418
  "DET|\u9023\u4f53\u8a5e|_+NOUN|\u540d\u8a5e|_": {
 
543
  "purai"
544
  ]
545
  },
546
+ "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+NOUN|\u540d\u8a5e|_": {
547
+ "\u30ad\u30e2\u30eb\u31f1\u30da": [
548
+ "\u30ad\u31fa",
549
+ "\u30aa\u30eb\u31f1\u30da"
550
+ ]
551
+ },
552
  "NOUN|\u4f4d\u7f6e\u540d\u8a5e|_+VERB|\u4ed6\u52d5\u8a5e|_": {
553
  "Omakun": [
554
  "Omak",
 
790
  "chi",
791
  "kik"
792
  ],
793
+ "chitak": [
794
+ "chi",
795
+ "tak"
796
+ ],
797
  "chitomtekarkar": [
798
  "chi",
799
  "tomtekarkar"
 
949
  },
950
  "tokenizer_class": "DebertaV2TokenizerFast",
951
  "torch_dtype": "float32",
952
+ "transformers_version": "4.27.1",
953
  "type_vocab_size": 0,
954
  "vocab_size": 6877
955
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0902d73fae30236420e358b4ef9dd3e44325e31a6564328769c43edfa19a9f9
3
- size 421791123
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2efc5d6f30105e2592b8708338b67623aa7f19376cad9d7bd41cf83e91257c5d
3
+ size 421797267
supar.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9dc80c0cc7f37cc0b27affda69468bdd7cedec99b1d811e580e6519f1f79958
3
- size 467277003
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16c368bff0f1b36e1ff7cd7ee0358205bb11dfdfe08068803a244bfce6faad69
3
+ size 467329611