upload
Browse files- data/sanskrit_token_list/bpe_unigram500/bpe.model +3 -0
- data/sanskrit_token_list/bpe_unigram500/bpe.vocab +500 -0
- data/sanskrit_token_list/bpe_unigram500/tokens.txt +500 -0
- data/sanskrit_token_list/bpe_unigram500/train.txt +3 -0
- exp/asr_stats_raw_sanskrit_bpe500/train/feats_stats.npz +3 -0
- exp/asr_train_asr_raw_sanskrit_bpe500/config.yaml +711 -0
- exp/asr_train_asr_raw_sanskrit_bpe500/valid.acc.ave_10best.pth +3 -0
data/sanskrit_token_list/bpe_unigram500/bpe.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8479523d56d02edd35fde51517ab8e262300511106d3d7b94f49f436c999987f
|
3 |
+
size 246335
|
data/sanskrit_token_list/bpe_unigram500/bpe.vocab
ADDED
@@ -0,0 +1,500 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<unk> 0
|
2 |
+
<s> 0
|
3 |
+
</s> 0
|
4 |
+
▁ -3.28502
|
5 |
+
ं -3.3663
|
6 |
+
े -3.68994
|
7 |
+
ा -3.74551
|
8 |
+
ः -3.83449
|
9 |
+
र -4.01342
|
10 |
+
व -4.12588
|
11 |
+
म -4.13212
|
12 |
+
ि -4.2066
|
13 |
+
ो -4.22442
|
14 |
+
ी -4.32804
|
15 |
+
▁स -4.38071
|
16 |
+
न -4.42089
|
17 |
+
त -4.43767
|
18 |
+
▁॥ -4.453
|
19 |
+
क -4.46445
|
20 |
+
य -4.54343
|
21 |
+
म् -4.58134
|
22 |
+
ु -4.60504
|
23 |
+
द -4.60696
|
24 |
+
प -4.61284
|
25 |
+
ल -4.6386
|
26 |
+
▁अ -4.65739
|
27 |
+
स्य -4.67526
|
28 |
+
ति -4.74065
|
29 |
+
स -4.75371
|
30 |
+
्य -4.79863
|
31 |
+
▁न -4.80911
|
32 |
+
▁च -4.89435
|
33 |
+
र् -4.98229
|
34 |
+
श -5.00555
|
35 |
+
ह -5.01599
|
36 |
+
त् -5.10823
|
37 |
+
ग -5.11338
|
38 |
+
▁प्र -5.12576
|
39 |
+
▁त -5.13674
|
40 |
+
▁वि -5.1464
|
41 |
+
॒ -5.15054
|
42 |
+
▁क -5.19256
|
43 |
+
ज -5.2388
|
44 |
+
ण -5.24096
|
45 |
+
ना -5.28419
|
46 |
+
् -5.28435
|
47 |
+
ृ -5.30825
|
48 |
+
▁व -5.31953
|
49 |
+
त्र -5.36902
|
50 |
+
च -5.38532
|
51 |
+
▁य -5.39441
|
52 |
+
ू -5.41528
|
53 |
+
या -5.44013
|
54 |
+
न् -5.47754
|
55 |
+
ता -5.49061
|
56 |
+
क्ष -5.50348
|
57 |
+
॑ -5.5044
|
58 |
+
▁प -5.51506
|
59 |
+
ौ -5.53761
|
60 |
+
ै -5.56035
|
61 |
+
▁म -5.56344
|
62 |
+
▁श -5.60024
|
63 |
+
ष -5.6167
|
64 |
+
भ -5.62716
|
65 |
+
ध -5.66206
|
66 |
+
▁आ -5.66861
|
67 |
+
न्त -5.68184
|
68 |
+
▁ग -5.68568
|
69 |
+
मा -5.71023
|
70 |
+
थ -5.71445
|
71 |
+
वि -5.74223
|
72 |
+
रा -5.75677
|
73 |
+
ख -5.77239
|
74 |
+
▁ह -5.77783
|
75 |
+
▁द -5.79018
|
76 |
+
ित -5.80289
|
77 |
+
नि -5.83023
|
78 |
+
्या -5.83365
|
79 |
+
ते -5.84883
|
80 |
+
ेन -5.85131
|
81 |
+
प्र -5.88431
|
82 |
+
▁इति -5.8928
|
83 |
+
द् -5.90339
|
84 |
+
▁स्व -5.90604
|
85 |
+
तः -5.90692
|
86 |
+
ाय -5.91855
|
87 |
+
ट -5.92272
|
88 |
+
स्त -5.94887
|
89 |
+
वा -5.9602
|
90 |
+
दा -5.96292
|
91 |
+
▁वा -5.97659
|
92 |
+
ाः -5.99624
|
93 |
+
▁भ -6.02596
|
94 |
+
▁ज -6.04663
|
95 |
+
तु -6.05981
|
96 |
+
त्य -6.06614
|
97 |
+
मि -6.08467
|
98 |
+
ष्ट -6.09682
|
99 |
+
रु -6.14564
|
100 |
+
▁नि -6.15356
|
101 |
+
▁एव -6.18819
|
102 |
+
▁सु -6.20581
|
103 |
+
▁१ -6.20761
|
104 |
+
न्ति -6.21163
|
105 |
+
▁इ -6.21962
|
106 |
+
स् -6.22068
|
107 |
+
▁ब -6.22857
|
108 |
+
▁उ -6.24591
|
109 |
+
रि -6.25677
|
110 |
+
ङ्ग -6.26997
|
111 |
+
घ -6.27434
|
112 |
+
▁सर्व -6.28722
|
113 |
+
▁मा -6.29226
|
114 |
+
श्च -6.29641
|
115 |
+
▁पर -6.29729
|
116 |
+
▁ध -6.30305
|
117 |
+
त्व -6.32427
|
118 |
+
न्द -6.33103
|
119 |
+
ां -6.34945
|
120 |
+
पि -6.3545
|
121 |
+
▁श्री -6.36077
|
122 |
+
यं -6.36163
|
123 |
+
सा -6.37449
|
124 |
+
▁सा -6.38411
|
125 |
+
० -6.39855
|
126 |
+
नु -6.40209
|
127 |
+
कार -6.4092
|
128 |
+
यो -6.42085
|
129 |
+
नं -6.42236
|
130 |
+
▁पा -6.4391
|
131 |
+
ने -6.44077
|
132 |
+
क्त -6.44712
|
133 |
+
▁भव -6.45583
|
134 |
+
ास -6.46378
|
135 |
+
ात् -6.46455
|
136 |
+
ब -6.47556
|
137 |
+
ती -6.4758
|
138 |
+
▁र -6.48119
|
139 |
+
त्त -6.49582
|
140 |
+
द्य -6.50821
|
141 |
+
रण -6.51136
|
142 |
+
ला -6.51617
|
143 |
+
द्व -6.53662
|
144 |
+
▁का -6.55994
|
145 |
+
पा -6.56106
|
146 |
+
दि -6.57736
|
147 |
+
धा -6.58115
|
148 |
+
स्थ -6.60008
|
149 |
+
ड -6.60252
|
150 |
+
▁ल -6.60669
|
151 |
+
न्न -6.61221
|
152 |
+
धि -6.61669
|
153 |
+
्वा -6.61918
|
154 |
+
ान् -6.61957
|
155 |
+
भि -6.62558
|
156 |
+
रे -6.6319
|
157 |
+
▁त्व -6.637
|
158 |
+
द्ध -6.63974
|
159 |
+
रूप -6.64052
|
160 |
+
र्थ -6.64152
|
161 |
+
क् -6.65254
|
162 |
+
र्य -6.65933
|
163 |
+
मान -6.66308
|
164 |
+
ये -6.66897
|
165 |
+
रो -6.66945
|
166 |
+
त्वा -6.67258
|
167 |
+
ोऽ -6.67578
|
168 |
+
न्द्र -6.69443
|
169 |
+
ेषु -6.6987
|
170 |
+
णा -6.70841
|
171 |
+
▁हि -6.70933
|
172 |
+
▁तस्य -6.71183
|
173 |
+
तो -6.71396
|
174 |
+
व्य -6.71418
|
175 |
+
▁कु -6.71882
|
176 |
+
देश -6.72193
|
177 |
+
▁भवति -6.72342
|
178 |
+
▁ते -6.72593
|
179 |
+
▁प्रा -6.72735
|
180 |
+
वान् -6.73317
|
181 |
+
▁सम -6.7362
|
182 |
+
सि -6.74754
|
183 |
+
▁२ -6.74913
|
184 |
+
न्य -6.75084
|
185 |
+
ेण -6.75828
|
186 |
+
का -6.76298
|
187 |
+
ानि -6.77141
|
188 |
+
नी -6.77244
|
189 |
+
सु -6.77303
|
190 |
+
▁ॐ -6.77703
|
191 |
+
ानां -6.7803
|
192 |
+
ध्य -6.79199
|
193 |
+
मे -6.79238
|
194 |
+
ैव -6.80511
|
195 |
+
हि -6.80885
|
196 |
+
िक -6.82145
|
197 |
+
स्म -6.82406
|
198 |
+
▁इत्य -6.8256
|
199 |
+
द्र -6.8264
|
200 |
+
१ -6.82691
|
201 |
+
यु -6.827
|
202 |
+
▁मे -6.82707
|
203 |
+
मु -6.82822
|
204 |
+
कृत -6.83927
|
205 |
+
ष्ठ -6.85585
|
206 |
+
ण्ड -6.85592
|
207 |
+
▁देव -6.87604
|
208 |
+
लि -6.88107
|
209 |
+
ैः -6.88373
|
210 |
+
च्छ -6.8868
|
211 |
+
▁तु -6.90667
|
212 |
+
▁अपि -6.90691
|
213 |
+
यः -6.91804
|
214 |
+
२ -6.92197
|
215 |
+
▁कृत -6.9392
|
216 |
+
तं -6.94838
|
217 |
+
िता -6.95536
|
218 |
+
ञ्च -6.95706
|
219 |
+
ष् -6.95964
|
220 |
+
▁ना -6.96352
|
221 |
+
भ्य -6.96635
|
222 |
+
री -6.97774
|
223 |
+
योग -6.9778
|
224 |
+
्यते -6.98361
|
225 |
+
चि -6.99235
|
226 |
+
भाव -6.99591
|
227 |
+
▁कि -7.01019
|
228 |
+
ङ्क -7.01873
|
229 |
+
स्मिन् -7.0191
|
230 |
+
▁पु -7.02222
|
231 |
+
र्ण -7.02342
|
232 |
+
ीय -7.02403
|
233 |
+
म्ब -7.03072
|
234 |
+
पद -7.03398
|
235 |
+
ाम -7.03571
|
236 |
+
▁एत -7.04097
|
237 |
+
र्व -7.04159
|
238 |
+
▁स्म -7.04176
|
239 |
+
▁प्रति -7.05029
|
240 |
+
▁तथा -7.05788
|
241 |
+
▁स् -7.06563
|
242 |
+
र्ग -7.06707
|
243 |
+
प्त -7.06966
|
244 |
+
ठ -7.07039
|
245 |
+
ाह -7.07298
|
246 |
+
▁३ -7.08098
|
247 |
+
भव -7.09609
|
248 |
+
पु -7.09749
|
249 |
+
भा -7.09872
|
250 |
+
▁एक -7.09971
|
251 |
+
ान्त -7.1134
|
252 |
+
▁परि -7.11737
|
253 |
+
ज्ञ -7.11821
|
254 |
+
नो -7.12229
|
255 |
+
▁अस्ति -7.12292
|
256 |
+
९ -7.12759
|
257 |
+
श्र -7.1276
|
258 |
+
▁मन -7.13393
|
259 |
+
स्व -7.13453
|
260 |
+
ार्थ -7.13597
|
261 |
+
▁या -7.14465
|
262 |
+
शि -7.14725
|
263 |
+
जा -7.15055
|
264 |
+
ात्म -7.15093
|
265 |
+
लोक -7.15539
|
266 |
+
राज -7.1582
|
267 |
+
▁वै -7.16634
|
268 |
+
ग्र -7.16922
|
269 |
+
▁जन -7.17131
|
270 |
+
३ -7.18476
|
271 |
+
▁सह -7.18887
|
272 |
+
देव -7.19377
|
273 |
+
ादि -7.19594
|
274 |
+
▁उप -7.1973
|
275 |
+
▁निर् -7.2027
|
276 |
+
र्ष -7.20366
|
277 |
+
शा -7.20835
|
278 |
+
▁दु -7.21324
|
279 |
+
ङ् -7.21533
|
280 |
+
▁राज -7.2375
|
281 |
+
५ -7.23759
|
282 |
+
▁ब्रह्म -7.24062
|
283 |
+
मह -7.25021
|
284 |
+
▁महा -7.25111
|
285 |
+
४ -7.2518
|
286 |
+
ज्ञान -7.25798
|
287 |
+
▁कथ -7.26427
|
288 |
+
ेऽ -7.27204
|
289 |
+
जन -7.27534
|
290 |
+
▁भू -7.28145
|
291 |
+
स्थित -7.28361
|
292 |
+
▁तत् -7.28971
|
293 |
+
श्व -7.29123
|
294 |
+
▁मह -7.29133
|
295 |
+
६ -7.29337
|
296 |
+
स्तु -7.29583
|
297 |
+
सं -7.29597
|
298 |
+
▁व्य -7.30802
|
299 |
+
गुण -7.30949
|
300 |
+
सिद्ध -7.31102
|
301 |
+
चित् -7.31375
|
302 |
+
ायाः -7.31876
|
303 |
+
विषय -7.32191
|
304 |
+
श् -7.32232
|
305 |
+
▁नमः -7.32239
|
306 |
+
त्स -7.33478
|
307 |
+
ाणि -7.33561
|
308 |
+
▁४ -7.3389
|
309 |
+
िका -7.34266
|
310 |
+
प् -7.34801
|
311 |
+
वर्त -7.3507
|
312 |
+
फ -7.35364
|
313 |
+
ापि -7.354
|
314 |
+
स्ति -7.3563
|
315 |
+
हित -7.35961
|
316 |
+
मुख -7.36485
|
317 |
+
चार -7.36919
|
318 |
+
मेव -7.3788
|
319 |
+
▁श्र -7.38193
|
320 |
+
▁क्र -7.38534
|
321 |
+
षा -7.38793
|
322 |
+
दु -7.38897
|
323 |
+
▁ह्रीं -7.4066
|
324 |
+
न्ध -7.40941
|
325 |
+
ब्द -7.40942
|
326 |
+
▁तत्र -7.41291
|
327 |
+
ष्ण -7.41308
|
328 |
+
ग् -7.41926
|
329 |
+
▁आसीत् -7.42156
|
330 |
+
▁रा -7.4319
|
331 |
+
▁ता -7.43358
|
332 |
+
▁विश्व -7.43906
|
333 |
+
▁अस्य -7.4405
|
334 |
+
ल् -7.44403
|
335 |
+
▁मु -7.44922
|
336 |
+
म्भ -7.45178
|
337 |
+
ढ -7.45475
|
338 |
+
▁यत् -7.45532
|
339 |
+
▁नाम -7.46669
|
340 |
+
क्र -7.46954
|
341 |
+
▁शा -7.47137
|
342 |
+
कं -7.48257
|
343 |
+
दर्श -7.4844
|
344 |
+
मपि -7.48483
|
345 |
+
धु -7.48552
|
346 |
+
पाद -7.48836
|
347 |
+
ामि -7.49548
|
348 |
+
लय -7.49988
|
349 |
+
▁शु -7.5008
|
350 |
+
प्य -7.50141
|
351 |
+
काल -7.50751
|
352 |
+
▁राम -7.51115
|
353 |
+
▁शिव -7.52329
|
354 |
+
णि -7.52536
|
355 |
+
▁भारत -7.52841
|
356 |
+
▁५ -7.53003
|
357 |
+
स्थान -7.54459
|
358 |
+
िष्य -7.55599
|
359 |
+
फल -7.55712
|
360 |
+
▁यथा -7.55919
|
361 |
+
ितं -7.55983
|
362 |
+
▁मम -7.56152
|
363 |
+
▁ष -7.56363
|
364 |
+
त्या -7.56643
|
365 |
+
॥ -7.57365
|
366 |
+
ट् -7.58369
|
367 |
+
▁किं -7.58889
|
368 |
+
▁पूर्व -7.58928
|
369 |
+
ग्न -7.59219
|
370 |
+
न्ते -7.59855
|
371 |
+
भाग -7.59859
|
372 |
+
ायां -7.60555
|
373 |
+
यते -7.60781
|
374 |
+
ज्ञा -7.61471
|
375 |
+
क्षण -7.61552
|
376 |
+
च्च -7.61975
|
377 |
+
▁भा -7.62125
|
378 |
+
ऽ -7.62178
|
379 |
+
नेन -7.626
|
380 |
+
▁६ -7.62702
|
381 |
+
ग्रह -7.62714
|
382 |
+
▁तदा -7.62746
|
383 |
+
▁प्रत्य -7.63073
|
384 |
+
▁क्लीं -7.63331
|
385 |
+
विद्या -7.63656
|
386 |
+
शु -7.6393
|
387 |
+
वृत्त -7.63984
|
388 |
+
▁पुन -7.64454
|
389 |
+
▁यो -7.64783
|
390 |
+
▁शि -7.64928
|
391 |
+
परि -7.64967
|
392 |
+
भू -7.65712
|
393 |
+
भूत -7.66556
|
394 |
+
▁काल -7.66596
|
395 |
+
भिः -7.67737
|
396 |
+
▁कर्म -7.68342
|
397 |
+
▁तद -7.68402
|
398 |
+
▁अनु -7.6851
|
399 |
+
▁जीव -7.68929
|
400 |
+
ल्ल -7.69416
|
401 |
+
णी -7.69552
|
402 |
+
▁सदा -7.69793
|
403 |
+
विध -7.6994
|
404 |
+
▁दृष्ट -7.70078
|
405 |
+
माण -7.70289
|
406 |
+
▁प्राप्त -7.71179
|
407 |
+
मण्डल -7.71241
|
408 |
+
र्ध -7.71365
|
409 |
+
स्त्र -7.716
|
410 |
+
शेष -7.71661
|
411 |
+
▁समा -7.71915
|
412 |
+
दृश -7.71916
|
413 |
+
न्तु -7.71986
|
414 |
+
भ्र -7.72128
|
415 |
+
ञ्ज -7.7228
|
416 |
+
▁यदि -7.72639
|
417 |
+
ेषां -7.73414
|
418 |
+
▁गृह -7.73851
|
419 |
+
▁वेद -7.7425
|
420 |
+
भाष -7.74612
|
421 |
+
▁त्रि -7.74926
|
422 |
+
▁कार्य -7.75373
|
423 |
+
पूर्ण -7.75764
|
424 |
+
युक्त -7.76035
|
425 |
+
▁कृ -7.77237
|
426 |
+
▁जात -7.78685
|
427 |
+
छ -7.78691
|
428 |
+
ाऽ -7.7933
|
429 |
+
क्रम -7.82447
|
430 |
+
दिन -7.83062
|
431 |
+
बन्ध -7.83149
|
432 |
+
करण -7.84488
|
433 |
+
पुरुष -7.84923
|
434 |
+
ोऽपि -7.85128
|
435 |
+
▁भक्त -7.86764
|
436 |
+
ाणां -7.86875
|
437 |
+
ख्या -7.87008
|
438 |
+
धान -7.87138
|
439 |
+
▁अन्य -7.87157
|
440 |
+
व्र -7.87624
|
441 |
+
हार -7.87827
|
442 |
+
▁किन्त -7.89689
|
443 |
+
ेश्वर -7.89899
|
444 |
+
हृद -7.90535
|
445 |
+
प्रिय -7.90785
|
446 |
+
क्रिय -7.90832
|
447 |
+
काश -7.90842
|
448 |
+
▁मृ -7.91237
|
449 |
+
▁पञ्च -7.91572
|
450 |
+
नगर -7.91939
|
451 |
+
शास्त्र -7.93618
|
452 |
+
▁बहु -7.93779
|
453 |
+
कल्प -7.94826
|
454 |
+
ई -7.95012
|
455 |
+
ब्र -7.95055
|
456 |
+
▁अभवत् -7.95454
|
457 |
+
पूज -7.96456
|
458 |
+
▁१९ -7.97208
|
459 |
+
▁नित्य -7.97357
|
460 |
+
गच्छ -7.97903
|
461 |
+
ज्ज -8.00158
|
462 |
+
मन्त्र -8.00375
|
463 |
+
ग्रन्थ -8.00938
|
464 |
+
बुद्ध -8.01092
|
465 |
+
ब्ध -8.01214
|
466 |
+
▁भगवत -8.01407
|
467 |
+
▁कृत्वा -8.01755
|
468 |
+
ए -8.0841
|
469 |
+
ऐ -8.08685
|
470 |
+
ँ -8.21152
|
471 |
+
ळ -8.2539
|
472 |
+
ऊ -8.60667
|
473 |
+
ओ -8.61491
|
474 |
+
ञ -8.7015
|
475 |
+
औ -8.76665
|
476 |
+
झ -8.87873
|
477 |
+
ङ -9.14613
|
478 |
+
़ -9.14948
|
479 |
+
इ -9.5364
|
480 |
+
आ -9.85147
|
481 |
+
ॉ -10.1036
|
482 |
+
अ -10.2681
|
483 |
+
ॄ -10.2841
|
484 |
+
उ -10.3623
|
485 |
+
ॆ -10.7518
|
486 |
+
ॅ -11.1313
|
487 |
+
ॢ -11.9611
|
488 |
+
ॊ -12.0861
|
489 |
+
ऱ -12.3957
|
490 |
+
ॐ -13.141
|
491 |
+
ऌ -13.6783
|
492 |
+
ॠ -13.6784
|
493 |
+
ऎ -13.6785
|
494 |
+
ऴ -13.6786
|
495 |
+
ऑ -13.6787
|
496 |
+
ऋ -13.6788
|
497 |
+
८ -13.6789
|
498 |
+
ॡ -13.679
|
499 |
+
७ -13.679
|
500 |
+
॰ -13.679
|
data/sanskrit_token_list/bpe_unigram500/tokens.txt
ADDED
@@ -0,0 +1,500 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<blank>
|
2 |
+
<unk>
|
3 |
+
▁
|
4 |
+
ं
|
5 |
+
े
|
6 |
+
ा
|
7 |
+
ः
|
8 |
+
र
|
9 |
+
व
|
10 |
+
म
|
11 |
+
ि
|
12 |
+
ो
|
13 |
+
ी
|
14 |
+
▁स
|
15 |
+
न
|
16 |
+
त
|
17 |
+
▁॥
|
18 |
+
क
|
19 |
+
य
|
20 |
+
म्
|
21 |
+
ु
|
22 |
+
द
|
23 |
+
प
|
24 |
+
ल
|
25 |
+
▁अ
|
26 |
+
स्य
|
27 |
+
ति
|
28 |
+
स
|
29 |
+
्य
|
30 |
+
▁न
|
31 |
+
▁च
|
32 |
+
र्
|
33 |
+
श
|
34 |
+
ह
|
35 |
+
त्
|
36 |
+
ग
|
37 |
+
▁प्र
|
38 |
+
▁त
|
39 |
+
▁वि
|
40 |
+
॒
|
41 |
+
▁क
|
42 |
+
ज
|
43 |
+
ण
|
44 |
+
ना
|
45 |
+
्
|
46 |
+
ृ
|
47 |
+
▁व
|
48 |
+
त्र
|
49 |
+
च
|
50 |
+
▁य
|
51 |
+
ू
|
52 |
+
या
|
53 |
+
न्
|
54 |
+
ता
|
55 |
+
क्ष
|
56 |
+
॑
|
57 |
+
▁प
|
58 |
+
ौ
|
59 |
+
ै
|
60 |
+
▁म
|
61 |
+
▁श
|
62 |
+
ष
|
63 |
+
भ
|
64 |
+
ध
|
65 |
+
▁आ
|
66 |
+
न्त
|
67 |
+
▁ग
|
68 |
+
मा
|
69 |
+
थ
|
70 |
+
वि
|
71 |
+
रा
|
72 |
+
ख
|
73 |
+
▁ह
|
74 |
+
▁द
|
75 |
+
ित
|
76 |
+
नि
|
77 |
+
्या
|
78 |
+
ते
|
79 |
+
ेन
|
80 |
+
प्र
|
81 |
+
▁इति
|
82 |
+
द्
|
83 |
+
▁स्व
|
84 |
+
तः
|
85 |
+
ाय
|
86 |
+
ट
|
87 |
+
स्त
|
88 |
+
वा
|
89 |
+
दा
|
90 |
+
▁वा
|
91 |
+
ाः
|
92 |
+
▁भ
|
93 |
+
▁ज
|
94 |
+
तु
|
95 |
+
त्य
|
96 |
+
मि
|
97 |
+
ष्ट
|
98 |
+
रु
|
99 |
+
▁नि
|
100 |
+
▁एव
|
101 |
+
▁सु
|
102 |
+
▁१
|
103 |
+
न्ति
|
104 |
+
▁इ
|
105 |
+
स्
|
106 |
+
▁ब
|
107 |
+
▁उ
|
108 |
+
रि
|
109 |
+
ङ्ग
|
110 |
+
घ
|
111 |
+
▁सर्व
|
112 |
+
▁मा
|
113 |
+
श्च
|
114 |
+
▁पर
|
115 |
+
▁ध
|
116 |
+
त्व
|
117 |
+
न्द
|
118 |
+
ां
|
119 |
+
पि
|
120 |
+
▁श्री
|
121 |
+
यं
|
122 |
+
सा
|
123 |
+
▁सा
|
124 |
+
०
|
125 |
+
नु
|
126 |
+
कार
|
127 |
+
यो
|
128 |
+
नं
|
129 |
+
▁पा
|
130 |
+
ने
|
131 |
+
क्त
|
132 |
+
▁भव
|
133 |
+
ास
|
134 |
+
ात्
|
135 |
+
ब
|
136 |
+
ती
|
137 |
+
▁र
|
138 |
+
त्त
|
139 |
+
द्य
|
140 |
+
रण
|
141 |
+
ला
|
142 |
+
द्व
|
143 |
+
▁का
|
144 |
+
पा
|
145 |
+
दि
|
146 |
+
धा
|
147 |
+
स्थ
|
148 |
+
ड
|
149 |
+
▁ल
|
150 |
+
न्न
|
151 |
+
धि
|
152 |
+
्वा
|
153 |
+
ान्
|
154 |
+
भि
|
155 |
+
रे
|
156 |
+
▁त्व
|
157 |
+
द्ध
|
158 |
+
रूप
|
159 |
+
र्थ
|
160 |
+
क्
|
161 |
+
र्य
|
162 |
+
मान
|
163 |
+
ये
|
164 |
+
रो
|
165 |
+
त्वा
|
166 |
+
ोऽ
|
167 |
+
न्द्र
|
168 |
+
ेषु
|
169 |
+
णा
|
170 |
+
▁हि
|
171 |
+
▁तस्य
|
172 |
+
तो
|
173 |
+
व्य
|
174 |
+
▁कु
|
175 |
+
देश
|
176 |
+
▁भवति
|
177 |
+
▁ते
|
178 |
+
▁प्रा
|
179 |
+
वान्
|
180 |
+
▁सम
|
181 |
+
सि
|
182 |
+
▁२
|
183 |
+
न्य
|
184 |
+
ेण
|
185 |
+
का
|
186 |
+
ानि
|
187 |
+
नी
|
188 |
+
सु
|
189 |
+
▁ॐ
|
190 |
+
ानां
|
191 |
+
ध्य
|
192 |
+
मे
|
193 |
+
ैव
|
194 |
+
हि
|
195 |
+
िक
|
196 |
+
स्म
|
197 |
+
▁इत्य
|
198 |
+
द्र
|
199 |
+
१
|
200 |
+
यु
|
201 |
+
▁मे
|
202 |
+
मु
|
203 |
+
कृत
|
204 |
+
ष्ठ
|
205 |
+
ण्ड
|
206 |
+
▁देव
|
207 |
+
लि
|
208 |
+
ैः
|
209 |
+
च्छ
|
210 |
+
▁तु
|
211 |
+
▁अपि
|
212 |
+
यः
|
213 |
+
२
|
214 |
+
▁कृत
|
215 |
+
तं
|
216 |
+
िता
|
217 |
+
ञ्च
|
218 |
+
ष्
|
219 |
+
▁ना
|
220 |
+
भ्य
|
221 |
+
री
|
222 |
+
योग
|
223 |
+
्यते
|
224 |
+
चि
|
225 |
+
भाव
|
226 |
+
▁कि
|
227 |
+
ङ्क
|
228 |
+
स्मिन्
|
229 |
+
▁पु
|
230 |
+
र्ण
|
231 |
+
ीय
|
232 |
+
म्ब
|
233 |
+
पद
|
234 |
+
ाम
|
235 |
+
▁एत
|
236 |
+
र्व
|
237 |
+
▁स्म
|
238 |
+
▁प्रति
|
239 |
+
▁तथा
|
240 |
+
▁स्
|
241 |
+
र्ग
|
242 |
+
प्त
|
243 |
+
ठ
|
244 |
+
ाह
|
245 |
+
▁३
|
246 |
+
भव
|
247 |
+
पु
|
248 |
+
भा
|
249 |
+
▁एक
|
250 |
+
ान्त
|
251 |
+
▁परि
|
252 |
+
ज्ञ
|
253 |
+
नो
|
254 |
+
▁अस्ति
|
255 |
+
९
|
256 |
+
श्र
|
257 |
+
▁मन
|
258 |
+
स्व
|
259 |
+
ार्थ
|
260 |
+
▁या
|
261 |
+
शि
|
262 |
+
जा
|
263 |
+
ात्म
|
264 |
+
लोक
|
265 |
+
राज
|
266 |
+
▁वै
|
267 |
+
ग्र
|
268 |
+
▁जन
|
269 |
+
३
|
270 |
+
▁सह
|
271 |
+
देव
|
272 |
+
ादि
|
273 |
+
▁उप
|
274 |
+
▁निर्
|
275 |
+
र्ष
|
276 |
+
शा
|
277 |
+
▁दु
|
278 |
+
ङ्
|
279 |
+
▁राज
|
280 |
+
५
|
281 |
+
▁ब्रह्म
|
282 |
+
मह
|
283 |
+
▁महा
|
284 |
+
४
|
285 |
+
ज्ञान
|
286 |
+
▁कथ
|
287 |
+
ेऽ
|
288 |
+
जन
|
289 |
+
▁भू
|
290 |
+
स्थित
|
291 |
+
▁तत्
|
292 |
+
श्व
|
293 |
+
▁मह
|
294 |
+
६
|
295 |
+
स्तु
|
296 |
+
सं
|
297 |
+
▁व्य
|
298 |
+
गुण
|
299 |
+
सिद्ध
|
300 |
+
चित्
|
301 |
+
ायाः
|
302 |
+
विषय
|
303 |
+
श्
|
304 |
+
▁नमः
|
305 |
+
त्स
|
306 |
+
ाणि
|
307 |
+
▁४
|
308 |
+
िका
|
309 |
+
प्
|
310 |
+
वर्त
|
311 |
+
फ
|
312 |
+
ापि
|
313 |
+
स्ति
|
314 |
+
हित
|
315 |
+
मुख
|
316 |
+
चार
|
317 |
+
मेव
|
318 |
+
▁श्र
|
319 |
+
▁क्र
|
320 |
+
षा
|
321 |
+
दु
|
322 |
+
▁ह्रीं
|
323 |
+
न्ध
|
324 |
+
ब्द
|
325 |
+
▁तत्र
|
326 |
+
ष्ण
|
327 |
+
ग्
|
328 |
+
▁आसीत्
|
329 |
+
▁रा
|
330 |
+
▁ता
|
331 |
+
▁विश्व
|
332 |
+
▁अस्य
|
333 |
+
ल्
|
334 |
+
▁मु
|
335 |
+
म्भ
|
336 |
+
ढ
|
337 |
+
▁यत्
|
338 |
+
▁नाम
|
339 |
+
क्र
|
340 |
+
▁शा
|
341 |
+
कं
|
342 |
+
दर्श
|
343 |
+
मपि
|
344 |
+
धु
|
345 |
+
पाद
|
346 |
+
ामि
|
347 |
+
लय
|
348 |
+
▁शु
|
349 |
+
प्य
|
350 |
+
काल
|
351 |
+
▁राम
|
352 |
+
▁शिव
|
353 |
+
णि
|
354 |
+
▁भारत
|
355 |
+
▁५
|
356 |
+
स्थान
|
357 |
+
िष्य
|
358 |
+
फल
|
359 |
+
▁यथा
|
360 |
+
ितं
|
361 |
+
▁मम
|
362 |
+
▁ष
|
363 |
+
त्या
|
364 |
+
॥
|
365 |
+
ट्
|
366 |
+
▁किं
|
367 |
+
▁पूर्व
|
368 |
+
ग्न
|
369 |
+
न्ते
|
370 |
+
भाग
|
371 |
+
ायां
|
372 |
+
यते
|
373 |
+
ज्ञा
|
374 |
+
क्षण
|
375 |
+
च्च
|
376 |
+
▁भा
|
377 |
+
ऽ
|
378 |
+
नेन
|
379 |
+
▁६
|
380 |
+
ग्रह
|
381 |
+
▁तदा
|
382 |
+
▁प्रत्य
|
383 |
+
▁क्लीं
|
384 |
+
विद्या
|
385 |
+
शु
|
386 |
+
वृत्त
|
387 |
+
▁पुन
|
388 |
+
▁यो
|
389 |
+
▁शि
|
390 |
+
परि
|
391 |
+
भू
|
392 |
+
भूत
|
393 |
+
▁काल
|
394 |
+
भिः
|
395 |
+
▁कर्म
|
396 |
+
▁तद
|
397 |
+
▁अनु
|
398 |
+
▁जीव
|
399 |
+
ल्ल
|
400 |
+
णी
|
401 |
+
▁सदा
|
402 |
+
विध
|
403 |
+
▁दृष्ट
|
404 |
+
माण
|
405 |
+
▁प्राप्त
|
406 |
+
मण्डल
|
407 |
+
र्ध
|
408 |
+
स्त्र
|
409 |
+
शेष
|
410 |
+
▁समा
|
411 |
+
दृश
|
412 |
+
न्तु
|
413 |
+
भ्र
|
414 |
+
ञ्ज
|
415 |
+
▁यदि
|
416 |
+
ेषां
|
417 |
+
▁गृह
|
418 |
+
▁वेद
|
419 |
+
भाष
|
420 |
+
▁त्रि
|
421 |
+
▁कार्य
|
422 |
+
पूर्ण
|
423 |
+
युक्त
|
424 |
+
▁कृ
|
425 |
+
▁जात
|
426 |
+
छ
|
427 |
+
ाऽ
|
428 |
+
क्रम
|
429 |
+
दिन
|
430 |
+
बन्ध
|
431 |
+
करण
|
432 |
+
पुरुष
|
433 |
+
ोऽपि
|
434 |
+
▁भक्त
|
435 |
+
ाणां
|
436 |
+
ख्या
|
437 |
+
धान
|
438 |
+
▁अन्य
|
439 |
+
व्र
|
440 |
+
हार
|
441 |
+
▁किन्त
|
442 |
+
ेश्वर
|
443 |
+
हृद
|
444 |
+
प्रिय
|
445 |
+
क्रिय
|
446 |
+
काश
|
447 |
+
▁मृ
|
448 |
+
▁पञ्च
|
449 |
+
नगर
|
450 |
+
शास्त्र
|
451 |
+
▁बहु
|
452 |
+
कल्प
|
453 |
+
ई
|
454 |
+
ब्र
|
455 |
+
▁अभवत्
|
456 |
+
पूज
|
457 |
+
▁१९
|
458 |
+
▁नित्य
|
459 |
+
गच्छ
|
460 |
+
ज्ज
|
461 |
+
मन्त्र
|
462 |
+
ग्रन्थ
|
463 |
+
बुद्ध
|
464 |
+
ब्ध
|
465 |
+
▁भगवत
|
466 |
+
▁कृत्वा
|
467 |
+
ए
|
468 |
+
ऐ
|
469 |
+
ँ
|
470 |
+
ळ
|
471 |
+
ऊ
|
472 |
+
ओ
|
473 |
+
ञ
|
474 |
+
औ
|
475 |
+
झ
|
476 |
+
ङ
|
477 |
+
़
|
478 |
+
इ
|
479 |
+
आ
|
480 |
+
ॉ
|
481 |
+
अ
|
482 |
+
ॄ
|
483 |
+
उ
|
484 |
+
ॆ
|
485 |
+
ॅ
|
486 |
+
ॢ
|
487 |
+
ॊ
|
488 |
+
ऱ
|
489 |
+
ॐ
|
490 |
+
ऌ
|
491 |
+
ॠ
|
492 |
+
ऎ
|
493 |
+
ऴ
|
494 |
+
ऑ
|
495 |
+
ऋ
|
496 |
+
८
|
497 |
+
ॡ
|
498 |
+
७
|
499 |
+
॰
|
500 |
+
<sos/eos>
|
data/sanskrit_token_list/bpe_unigram500/train.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a172744a1b64b5eb06b82aba7ba94b8d935a1416297cd0be12b0ec3e67db6597
|
3 |
+
size 7261308
|
exp/asr_stats_raw_sanskrit_bpe500/train/feats_stats.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27b65c52c35a11db4d87927f76a1a8a61af0cdf2b8a85b96fc38bb666b8e28a8
|
3 |
+
size 1402
|
exp/asr_train_asr_raw_sanskrit_bpe500/config.yaml
ADDED
@@ -0,0 +1,711 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
config: conf/train_asr.yaml
|
2 |
+
print_config: false
|
3 |
+
log_level: INFO
|
4 |
+
dry_run: false
|
5 |
+
iterator_type: sequence
|
6 |
+
output_dir: exp/asr_train_asr_raw_sanskrit_bpe500
|
7 |
+
ngpu: 1
|
8 |
+
seed: 2022
|
9 |
+
num_workers: 4
|
10 |
+
num_att_plot: 3
|
11 |
+
dist_backend: nccl
|
12 |
+
dist_init_method: env://
|
13 |
+
dist_world_size: null
|
14 |
+
dist_rank: null
|
15 |
+
local_rank: 0
|
16 |
+
dist_master_addr: null
|
17 |
+
dist_master_port: null
|
18 |
+
dist_launcher: null
|
19 |
+
multiprocessing_distributed: false
|
20 |
+
unused_parameters: false
|
21 |
+
sharded_ddp: false
|
22 |
+
cudnn_enabled: true
|
23 |
+
cudnn_benchmark: false
|
24 |
+
cudnn_deterministic: true
|
25 |
+
collect_stats: false
|
26 |
+
write_collected_feats: false
|
27 |
+
max_epoch: 70
|
28 |
+
patience: null
|
29 |
+
val_scheduler_criterion:
|
30 |
+
- valid
|
31 |
+
- loss
|
32 |
+
early_stopping_criterion:
|
33 |
+
- valid
|
34 |
+
- loss
|
35 |
+
- min
|
36 |
+
best_model_criterion:
|
37 |
+
- - valid
|
38 |
+
- acc
|
39 |
+
- max
|
40 |
+
keep_nbest_models: 10
|
41 |
+
nbest_averaging_interval: 0
|
42 |
+
grad_clip: 5.0
|
43 |
+
grad_clip_type: 2.0
|
44 |
+
grad_noise: false
|
45 |
+
accum_grad: 4
|
46 |
+
no_forward_run: false
|
47 |
+
resume: true
|
48 |
+
train_dtype: float32
|
49 |
+
use_amp: true
|
50 |
+
log_interval: null
|
51 |
+
use_matplotlib: true
|
52 |
+
use_tensorboard: true
|
53 |
+
create_graph_in_tensorboard: false
|
54 |
+
use_wandb: false
|
55 |
+
wandb_project: null
|
56 |
+
wandb_id: null
|
57 |
+
wandb_entity: null
|
58 |
+
wandb_name: null
|
59 |
+
wandb_model_log_interval: -1
|
60 |
+
detect_anomaly: false
|
61 |
+
pretrain_path: null
|
62 |
+
init_param: []
|
63 |
+
ignore_init_mismatch: false
|
64 |
+
freeze_param: []
|
65 |
+
num_iters_per_epoch: null
|
66 |
+
batch_size: 20
|
67 |
+
valid_batch_size: null
|
68 |
+
batch_bins: 10000000
|
69 |
+
valid_batch_bins: null
|
70 |
+
train_shape_file:
|
71 |
+
- exp/asr_stats_raw_sanskrit_bpe500/train/speech_shape
|
72 |
+
- exp/asr_stats_raw_sanskrit_bpe500/train/text_shape.bpe
|
73 |
+
valid_shape_file:
|
74 |
+
- exp/asr_stats_raw_sanskrit_bpe500/valid/speech_shape
|
75 |
+
- exp/asr_stats_raw_sanskrit_bpe500/valid/text_shape.bpe
|
76 |
+
batch_type: numel
|
77 |
+
valid_batch_type: null
|
78 |
+
fold_length:
|
79 |
+
- 80000
|
80 |
+
- 150
|
81 |
+
sort_in_batch: descending
|
82 |
+
shuffle_within_batch: false
|
83 |
+
sort_batch: descending
|
84 |
+
multiple_iterator: false
|
85 |
+
chunk_length: 500
|
86 |
+
chunk_shift_ratio: 0.5
|
87 |
+
num_cache_chunks: 1024
|
88 |
+
chunk_excluded_key_prefixes: []
|
89 |
+
train_data_path_and_name_and_type:
|
90 |
+
- - dump/raw/sanskrit/train/wav.scp
|
91 |
+
- speech
|
92 |
+
- sound
|
93 |
+
- - dump/raw/sanskrit/train/text
|
94 |
+
- text
|
95 |
+
- text
|
96 |
+
valid_data_path_and_name_and_type:
|
97 |
+
- - dump/raw/sanskrit/valid/wav.scp
|
98 |
+
- speech
|
99 |
+
- sound
|
100 |
+
- - dump/raw/sanskrit/valid/text
|
101 |
+
- text
|
102 |
+
- text
|
103 |
+
allow_variable_data_keys: false
|
104 |
+
max_cache_size: 0.0
|
105 |
+
max_cache_fd: 32
|
106 |
+
valid_max_cache_size: null
|
107 |
+
exclude_weight_decay: false
|
108 |
+
exclude_weight_decay_conf: {}
|
109 |
+
optim: adam
|
110 |
+
optim_conf:
|
111 |
+
lr: 0.002
|
112 |
+
weight_decay: 1.0e-06
|
113 |
+
scheduler: warmuplr
|
114 |
+
scheduler_conf:
|
115 |
+
warmup_steps: 15000
|
116 |
+
token_list:
|
117 |
+
- <blank>
|
118 |
+
- <unk>
|
119 |
+
- ▁
|
120 |
+
- ं
|
121 |
+
- े
|
122 |
+
- ा
|
123 |
+
- ः
|
124 |
+
- र
|
125 |
+
- व
|
126 |
+
- म
|
127 |
+
- ि
|
128 |
+
- ो
|
129 |
+
- ी
|
130 |
+
- ▁स
|
131 |
+
- न
|
132 |
+
- त
|
133 |
+
- ▁॥
|
134 |
+
- क
|
135 |
+
- य
|
136 |
+
- म्
|
137 |
+
- ु
|
138 |
+
- द
|
139 |
+
- प
|
140 |
+
- ल
|
141 |
+
- ▁अ
|
142 |
+
- स्य
|
143 |
+
- ति
|
144 |
+
- स
|
145 |
+
- ्य
|
146 |
+
- ▁न
|
147 |
+
- ▁च
|
148 |
+
- र्
|
149 |
+
- श
|
150 |
+
- ह
|
151 |
+
- त्
|
152 |
+
- ग
|
153 |
+
- ▁प्र
|
154 |
+
- ▁त
|
155 |
+
- ▁वि
|
156 |
+
- ॒
|
157 |
+
- ▁क
|
158 |
+
- ज
|
159 |
+
- ण
|
160 |
+
- ना
|
161 |
+
- ्
|
162 |
+
- ृ
|
163 |
+
- ▁व
|
164 |
+
- त्र
|
165 |
+
- च
|
166 |
+
- ▁य
|
167 |
+
- ू
|
168 |
+
- या
|
169 |
+
- न्
|
170 |
+
- ता
|
171 |
+
- क्ष
|
172 |
+
- ॑
|
173 |
+
- ▁प
|
174 |
+
- ौ
|
175 |
+
- ै
|
176 |
+
- ▁म
|
177 |
+
- ▁श
|
178 |
+
- ष
|
179 |
+
- भ
|
180 |
+
- ध
|
181 |
+
- ▁आ
|
182 |
+
- न्त
|
183 |
+
- ▁ग
|
184 |
+
- मा
|
185 |
+
- थ
|
186 |
+
- वि
|
187 |
+
- रा
|
188 |
+
- ख
|
189 |
+
- ▁ह
|
190 |
+
- ▁द
|
191 |
+
- ित
|
192 |
+
- नि
|
193 |
+
- ्या
|
194 |
+
- ते
|
195 |
+
- ेन
|
196 |
+
- प्र
|
197 |
+
- ▁इति
|
198 |
+
- द्
|
199 |
+
- ▁स्व
|
200 |
+
- तः
|
201 |
+
- ाय
|
202 |
+
- ट
|
203 |
+
- स्त
|
204 |
+
- वा
|
205 |
+
- दा
|
206 |
+
- ▁वा
|
207 |
+
- ाः
|
208 |
+
- ▁भ
|
209 |
+
- ▁ज
|
210 |
+
- तु
|
211 |
+
- त्य
|
212 |
+
- मि
|
213 |
+
- ष्ट
|
214 |
+
- रु
|
215 |
+
- ▁नि
|
216 |
+
- ▁एव
|
217 |
+
- ▁सु
|
218 |
+
- ▁१
|
219 |
+
- न्ति
|
220 |
+
- ▁इ
|
221 |
+
- स्
|
222 |
+
- ▁ब
|
223 |
+
- ▁उ
|
224 |
+
- रि
|
225 |
+
- ङ्ग
|
226 |
+
- घ
|
227 |
+
- ▁सर्व
|
228 |
+
- ▁मा
|
229 |
+
- श्च
|
230 |
+
- ▁पर
|
231 |
+
- ▁ध
|
232 |
+
- त्व
|
233 |
+
- न्द
|
234 |
+
- ां
|
235 |
+
- पि
|
236 |
+
- ▁श्री
|
237 |
+
- यं
|
238 |
+
- सा
|
239 |
+
- ▁सा
|
240 |
+
- ०
|
241 |
+
- नु
|
242 |
+
- कार
|
243 |
+
- यो
|
244 |
+
- नं
|
245 |
+
- ▁पा
|
246 |
+
- ने
|
247 |
+
- क्त
|
248 |
+
- ▁भव
|
249 |
+
- ास
|
250 |
+
- ात्
|
251 |
+
- ब
|
252 |
+
- ती
|
253 |
+
- ▁र
|
254 |
+
- त्त
|
255 |
+
- द्य
|
256 |
+
- रण
|
257 |
+
- ला
|
258 |
+
- द्व
|
259 |
+
- ▁का
|
260 |
+
- पा
|
261 |
+
- दि
|
262 |
+
- धा
|
263 |
+
- स्थ
|
264 |
+
- ड
|
265 |
+
- ▁ल
|
266 |
+
- न्न
|
267 |
+
- धि
|
268 |
+
- ्वा
|
269 |
+
- ान्
|
270 |
+
- भि
|
271 |
+
- रे
|
272 |
+
- ▁त्व
|
273 |
+
- द्ध
|
274 |
+
- रूप
|
275 |
+
- र्थ
|
276 |
+
- क्
|
277 |
+
- र्य
|
278 |
+
- मान
|
279 |
+
- ये
|
280 |
+
- रो
|
281 |
+
- त्वा
|
282 |
+
- ोऽ
|
283 |
+
- न्द्र
|
284 |
+
- ेषु
|
285 |
+
- णा
|
286 |
+
- ▁हि
|
287 |
+
- ▁तस्य
|
288 |
+
- तो
|
289 |
+
- व्य
|
290 |
+
- ▁कु
|
291 |
+
- देश
|
292 |
+
- ▁भवति
|
293 |
+
- ▁ते
|
294 |
+
- ▁प्रा
|
295 |
+
- वान्
|
296 |
+
- ▁सम
|
297 |
+
- सि
|
298 |
+
- ▁२
|
299 |
+
- न्य
|
300 |
+
- ेण
|
301 |
+
- का
|
302 |
+
- ानि
|
303 |
+
- नी
|
304 |
+
- सु
|
305 |
+
- ▁ॐ
|
306 |
+
- ानां
|
307 |
+
- ध्य
|
308 |
+
- मे
|
309 |
+
- ैव
|
310 |
+
- हि
|
311 |
+
- िक
|
312 |
+
- स्म
|
313 |
+
- ▁इत्य
|
314 |
+
- द्र
|
315 |
+
- १
|
316 |
+
- यु
|
317 |
+
- ▁मे
|
318 |
+
- मु
|
319 |
+
- कृत
|
320 |
+
- ष्ठ
|
321 |
+
- ण्ड
|
322 |
+
- ▁देव
|
323 |
+
- लि
|
324 |
+
- ैः
|
325 |
+
- च्छ
|
326 |
+
- ▁तु
|
327 |
+
- ▁अपि
|
328 |
+
- यः
|
329 |
+
- २
|
330 |
+
- ▁कृत
|
331 |
+
- तं
|
332 |
+
- िता
|
333 |
+
- ञ्च
|
334 |
+
- ष्
|
335 |
+
- ▁ना
|
336 |
+
- भ्य
|
337 |
+
- री
|
338 |
+
- योग
|
339 |
+
- ्यते
|
340 |
+
- चि
|
341 |
+
- भाव
|
342 |
+
- ▁कि
|
343 |
+
- ङ्क
|
344 |
+
- स्मिन्
|
345 |
+
- ▁पु
|
346 |
+
- र्ण
|
347 |
+
- ीय
|
348 |
+
- म्ब
|
349 |
+
- पद
|
350 |
+
- ाम
|
351 |
+
- ▁एत
|
352 |
+
- र्व
|
353 |
+
- ▁स्म
|
354 |
+
- ▁प्रति
|
355 |
+
- ▁तथा
|
356 |
+
- ▁स्
|
357 |
+
- र्ग
|
358 |
+
- प्त
|
359 |
+
- ठ
|
360 |
+
- ाह
|
361 |
+
- ▁३
|
362 |
+
- भव
|
363 |
+
- पु
|
364 |
+
- भा
|
365 |
+
- ▁एक
|
366 |
+
- ान्त
|
367 |
+
- ▁परि
|
368 |
+
- ज्ञ
|
369 |
+
- नो
|
370 |
+
- ▁अस्ति
|
371 |
+
- ९
|
372 |
+
- श्र
|
373 |
+
- ▁मन
|
374 |
+
- स्व
|
375 |
+
- ार्थ
|
376 |
+
- ▁या
|
377 |
+
- शि
|
378 |
+
- जा
|
379 |
+
- ात्म
|
380 |
+
- लोक
|
381 |
+
- राज
|
382 |
+
- ▁वै
|
383 |
+
- ग्र
|
384 |
+
- ▁जन
|
385 |
+
- ३
|
386 |
+
- ▁सह
|
387 |
+
- देव
|
388 |
+
- ादि
|
389 |
+
- ▁उप
|
390 |
+
- ▁निर्
|
391 |
+
- र्ष
|
392 |
+
- शा
|
393 |
+
- ▁दु
|
394 |
+
- ङ्
|
395 |
+
- ▁राज
|
396 |
+
- ५
|
397 |
+
- ▁ब्रह्म
|
398 |
+
- मह
|
399 |
+
- ▁महा
|
400 |
+
- ४
|
401 |
+
- ज्ञान
|
402 |
+
- ▁कथ
|
403 |
+
- ेऽ
|
404 |
+
- जन
|
405 |
+
- ▁भू
|
406 |
+
- स्थित
|
407 |
+
- ▁तत्
|
408 |
+
- श्व
|
409 |
+
- ▁मह
|
410 |
+
- ६
|
411 |
+
- स्तु
|
412 |
+
- सं
|
413 |
+
- ▁व्य
|
414 |
+
- गुण
|
415 |
+
- सिद्ध
|
416 |
+
- चित्
|
417 |
+
- ायाः
|
418 |
+
- विषय
|
419 |
+
- श्
|
420 |
+
- ▁नमः
|
421 |
+
- त्स
|
422 |
+
- ाणि
|
423 |
+
- ▁४
|
424 |
+
- िका
|
425 |
+
- प्
|
426 |
+
- वर्त
|
427 |
+
- फ
|
428 |
+
- ापि
|
429 |
+
- स्ति
|
430 |
+
- हित
|
431 |
+
- मुख
|
432 |
+
- चार
|
433 |
+
- मेव
|
434 |
+
- ▁श्र
|
435 |
+
- ▁क्र
|
436 |
+
- षा
|
437 |
+
- दु
|
438 |
+
- ▁ह्रीं
|
439 |
+
- न्ध
|
440 |
+
- ब्द
|
441 |
+
- ▁तत्र
|
442 |
+
- ष्ण
|
443 |
+
- ग्
|
444 |
+
- ▁आसीत्
|
445 |
+
- ▁रा
|
446 |
+
- ▁ता
|
447 |
+
- ▁विश्व
|
448 |
+
- ▁अस्य
|
449 |
+
- ल्
|
450 |
+
- ▁मु
|
451 |
+
- म्भ
|
452 |
+
- ढ
|
453 |
+
- ▁यत्
|
454 |
+
- ▁नाम
|
455 |
+
- क्र
|
456 |
+
- ▁शा
|
457 |
+
- कं
|
458 |
+
- दर्श
|
459 |
+
- मपि
|
460 |
+
- धु
|
461 |
+
- पाद
|
462 |
+
- ामि
|
463 |
+
- लय
|
464 |
+
- ▁शु
|
465 |
+
- प्य
|
466 |
+
- काल
|
467 |
+
- ▁राम
|
468 |
+
- ▁शिव
|
469 |
+
- णि
|
470 |
+
- ▁भारत
|
471 |
+
- ▁५
|
472 |
+
- स्थान
|
473 |
+
- िष्य
|
474 |
+
- फल
|
475 |
+
- ▁यथा
|
476 |
+
- ितं
|
477 |
+
- ▁मम
|
478 |
+
- ▁ष
|
479 |
+
- त्या
|
480 |
+
- ॥
|
481 |
+
- ट्
|
482 |
+
- ▁किं
|
483 |
+
- ▁पूर्व
|
484 |
+
- ग्न
|
485 |
+
- न्ते
|
486 |
+
- भाग
|
487 |
+
- ायां
|
488 |
+
- यते
|
489 |
+
- ज्ञा
|
490 |
+
- क्षण
|
491 |
+
- च्च
|
492 |
+
- ▁भा
|
493 |
+
- ऽ
|
494 |
+
- नेन
|
495 |
+
- ▁६
|
496 |
+
- ग्रह
|
497 |
+
- ▁तदा
|
498 |
+
- ▁प्रत्य
|
499 |
+
- ▁क्लीं
|
500 |
+
- विद्या
|
501 |
+
- शु
|
502 |
+
- वृत्त
|
503 |
+
- ▁पुन
|
504 |
+
- ▁यो
|
505 |
+
- ▁शि
|
506 |
+
- परि
|
507 |
+
- भू
|
508 |
+
- भूत
|
509 |
+
- ▁काल
|
510 |
+
- भिः
|
511 |
+
- ▁कर्म
|
512 |
+
- ▁तद
|
513 |
+
- ▁अनु
|
514 |
+
- ▁जीव
|
515 |
+
- ल्ल
|
516 |
+
- णी
|
517 |
+
- ▁सदा
|
518 |
+
- विध
|
519 |
+
- ▁दृष्ट
|
520 |
+
- माण
|
521 |
+
- ▁प्राप्त
|
522 |
+
- मण्डल
|
523 |
+
- र्ध
|
524 |
+
- स्त्र
|
525 |
+
- शेष
|
526 |
+
- ▁समा
|
527 |
+
- दृश
|
528 |
+
- न्तु
|
529 |
+
- भ्र
|
530 |
+
- ञ्ज
|
531 |
+
- ▁यदि
|
532 |
+
- ेषां
|
533 |
+
- ▁गृह
|
534 |
+
- ▁वेद
|
535 |
+
- भाष
|
536 |
+
- ▁त्रि
|
537 |
+
- ▁कार्य
|
538 |
+
- पूर्ण
|
539 |
+
- युक्त
|
540 |
+
- ▁कृ
|
541 |
+
- ▁जात
|
542 |
+
- छ
|
543 |
+
- ाऽ
|
544 |
+
- क्रम
|
545 |
+
- दिन
|
546 |
+
- बन्ध
|
547 |
+
- करण
|
548 |
+
- पुरुष
|
549 |
+
- ोऽपि
|
550 |
+
- ▁भक्त
|
551 |
+
- ाणां
|
552 |
+
- ख्या
|
553 |
+
- धान
|
554 |
+
- ▁अन्य
|
555 |
+
- व्र
|
556 |
+
- हार
|
557 |
+
- ▁किन्त
|
558 |
+
- ेश्वर
|
559 |
+
- हृद
|
560 |
+
- प्रिय
|
561 |
+
- क्रिय
|
562 |
+
- काश
|
563 |
+
- ▁मृ
|
564 |
+
- ▁पञ्च
|
565 |
+
- नगर
|
566 |
+
- शास्त्र
|
567 |
+
- ▁बहु
|
568 |
+
- कल्प
|
569 |
+
- ई
|
570 |
+
- ब्र
|
571 |
+
- ▁अभवत्
|
572 |
+
- पूज
|
573 |
+
- ▁१९
|
574 |
+
- ▁नित्य
|
575 |
+
- गच्छ
|
576 |
+
- ज्ज
|
577 |
+
- मन्त्र
|
578 |
+
- ग्रन्थ
|
579 |
+
- बुद्ध
|
580 |
+
- ब्ध
|
581 |
+
- ▁भगवत
|
582 |
+
- ▁कृत्वा
|
583 |
+
- ए
|
584 |
+
- ऐ
|
585 |
+
- ँ
|
586 |
+
- ळ
|
587 |
+
- ऊ
|
588 |
+
- ओ
|
589 |
+
- ञ
|
590 |
+
- औ
|
591 |
+
- झ
|
592 |
+
- ङ
|
593 |
+
- ़
|
594 |
+
- इ
|
595 |
+
- आ
|
596 |
+
- ॉ
|
597 |
+
- अ
|
598 |
+
- ॄ
|
599 |
+
- उ
|
600 |
+
- ॆ
|
601 |
+
- ॅ
|
602 |
+
- ॢ
|
603 |
+
- ॊ
|
604 |
+
- ऱ
|
605 |
+
- ॐ
|
606 |
+
- ऌ
|
607 |
+
- ॠ
|
608 |
+
- ऎ
|
609 |
+
- ऴ
|
610 |
+
- ऑ
|
611 |
+
- ऋ
|
612 |
+
- ८
|
613 |
+
- ॡ
|
614 |
+
- ७
|
615 |
+
- ॰
|
616 |
+
- <sos/eos>
|
617 |
+
init: null
|
618 |
+
input_size: null
|
619 |
+
ctc_conf:
|
620 |
+
dropout_rate: 0.0
|
621 |
+
ctc_type: builtin
|
622 |
+
reduce: true
|
623 |
+
ignore_nan_grad: null
|
624 |
+
zero_infinity: true
|
625 |
+
joint_net_conf: null
|
626 |
+
use_preprocessor: true
|
627 |
+
token_type: bpe
|
628 |
+
bpemodel: data/sanskrit_token_list/bpe_unigram500/bpe.model
|
629 |
+
non_linguistic_symbols: null
|
630 |
+
cleaner: null
|
631 |
+
g2p: null
|
632 |
+
speech_volume_normalize: null
|
633 |
+
rir_scp: null
|
634 |
+
rir_apply_prob: 1.0
|
635 |
+
noise_scp: null
|
636 |
+
noise_apply_prob: 1.0
|
637 |
+
noise_db_range: '13_15'
|
638 |
+
short_noise_thres: 0.5
|
639 |
+
aux_ctc_tasks: []
|
640 |
+
frontend: default
|
641 |
+
frontend_conf:
|
642 |
+
n_fft: 512
|
643 |
+
win_length: 400
|
644 |
+
hop_length: 160
|
645 |
+
fs: 16k
|
646 |
+
specaug: specaug
|
647 |
+
specaug_conf:
|
648 |
+
apply_time_warp: true
|
649 |
+
time_warp_window: 5
|
650 |
+
time_warp_mode: bicubic
|
651 |
+
apply_freq_mask: true
|
652 |
+
freq_mask_width_range:
|
653 |
+
- 0
|
654 |
+
- 27
|
655 |
+
num_freq_mask: 2
|
656 |
+
apply_time_mask: true
|
657 |
+
time_mask_width_ratio_range:
|
658 |
+
- 0.0
|
659 |
+
- 0.05
|
660 |
+
num_time_mask: 5
|
661 |
+
normalize: global_mvn
|
662 |
+
normalize_conf:
|
663 |
+
stats_file: exp/asr_stats_raw_sanskrit_bpe500/train/feats_stats.npz
|
664 |
+
model: espnet
|
665 |
+
model_conf:
|
666 |
+
ctc_weight: 0.3
|
667 |
+
lsm_weight: 0.1
|
668 |
+
length_normalized_loss: false
|
669 |
+
preencoder: null
|
670 |
+
preencoder_conf: {}
|
671 |
+
encoder: e_branchformer
|
672 |
+
encoder_conf:
|
673 |
+
output_size: 256
|
674 |
+
attention_heads: 4
|
675 |
+
attention_layer_type: rel_selfattn
|
676 |
+
pos_enc_layer_type: rel_pos
|
677 |
+
rel_pos_type: latest
|
678 |
+
cgmlp_linear_units: 1024
|
679 |
+
cgmlp_conv_kernel: 31
|
680 |
+
use_linear_after_conv: false
|
681 |
+
gate_activation: identity
|
682 |
+
num_blocks: 12
|
683 |
+
dropout_rate: 0.1
|
684 |
+
positional_dropout_rate: 0.1
|
685 |
+
attention_dropout_rate: 0.1
|
686 |
+
input_layer: conv2d
|
687 |
+
layer_drop_rate: 0.0
|
688 |
+
linear_units: 1024
|
689 |
+
positionwise_layer_type: linear
|
690 |
+
use_ffn: true
|
691 |
+
macaron_ffn: true
|
692 |
+
merge_conv_kernel: 31
|
693 |
+
postencoder: null
|
694 |
+
postencoder_conf: {}
|
695 |
+
decoder: transformer
|
696 |
+
decoder_conf:
|
697 |
+
attention_heads: 4
|
698 |
+
linear_units: 2048
|
699 |
+
num_blocks: 6
|
700 |
+
dropout_rate: 0.1
|
701 |
+
positional_dropout_rate: 0.1
|
702 |
+
self_attention_dropout_rate: 0.1
|
703 |
+
src_attention_dropout_rate: 0.1
|
704 |
+
layer_drop_rate: 0.0
|
705 |
+
preprocessor: default
|
706 |
+
preprocessor_conf: {}
|
707 |
+
required:
|
708 |
+
- output_dir
|
709 |
+
- token_list
|
710 |
+
version: '202304'
|
711 |
+
distributed: false
|
exp/asr_train_asr_raw_sanskrit_bpe500/valid.acc.ave_10best.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f06bb5017138c0dcae1f5ea12ab4d6d4a7d8edbc22631bef3b049d4a430e8eb9
|
3 |
+
size 140354317
|