VlakoResker
committed on
Commit
·
3ca3c16
1
Parent(s):
fbd5903
add tokenizer
Browse files
- added_tokens.json +1 -1
- vocab.json +1 -1
added_tokens.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"<s>":
|
|
|
1 |
+
{"<s>": 79, "</s>": 80}
|
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"[PAD]": 0, "[UNK]": 1, "
|
|
|
1 |
+
{"[PAD]": 0, "[UNK]": 1, "á": 2, "r": 3, "с": 4, ")": 5, "я": 6, "j": 7, "…": 8, "s": 9, "ę": 10, "u": 11, "g": 12, "н": 13, "i": 14, "а": 15, "—": 16, "д": 17, "л": 18, "у": 19, "o": 20, "w": 21, "a": 22, "v": 23, "о": 24, "h": 25, "ф": 26, "&": 27, "f": 28, "ш": 29, "ч": 30, "é": 31, "b": 32, "(": 33, "ъ": 34, "y": 35, "q": 36, "б": 37, "–": 38, "’": 39, "ю": 40, "х": 41, "«": 42, "−": 43, "й": 44, "в": 45, " ": 46, "l": 47, "ц": 48, "р": 49, "d": 50, "‑": 51, "p": 52, "ы": 53, "z": 54, "п": 55, "к": 56, "м": 57, "m": 58, "г": 59, "ж": 60, "c": 61, "x": 62, "»": 63, "т": 64, "и": 65, "ō": 66, "t": 67, "ё": 68, "n": 69, "k": 70, "e": 71, "е": 72, "э": 73, "ö": 74, "з": 75, "ä": 76, "ь": 77, "щ": 78}
|