Upload tokenizer.json
Browse files- tokenizer.json +24 -3
tokenizer.json
CHANGED
@@ -929,6 +929,24 @@
|
|
929 |
"rstrip": false,
|
930 |
"normalized": false,
|
931 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
932 |
}
|
933 |
],
|
934 |
"normalizer": {
|
@@ -950,7 +968,8 @@
|
|
950 |
"pre_tokenizer": {
|
951 |
"type": "Metaspace",
|
952 |
"replacement": "▁",
|
953 |
-
"add_prefix_space": true
|
|
|
954 |
},
|
955 |
"post_processor": {
|
956 |
"type": "TemplateProcessing",
|
@@ -1009,7 +1028,8 @@
|
|
1009 |
"decoder": {
|
1010 |
"type": "Metaspace",
|
1011 |
"replacement": "▁",
|
1012 |
-
"add_prefix_space": true
|
|
|
1013 |
},
|
1014 |
"model": {
|
1015 |
"type": "Unigram",
|
@@ -129415,6 +129435,7 @@
|
|
129415 |
"<extra_id_0>",
|
129416 |
0.0
|
129417 |
]
|
129418 |
-
]
|
|
|
129419 |
}
|
129420 |
}
|
|
|
929 |
"rstrip": false,
|
930 |
"normalized": false,
|
931 |
"special": true
|
932 |
+
},
|
933 |
+
{
|
934 |
+
"id": 32100,
|
935 |
+
"content": "[PAD]",
|
936 |
+
"single_word": false,
|
937 |
+
"lstrip": false,
|
938 |
+
"rstrip": false,
|
939 |
+
"normalized": false,
|
940 |
+
"special": true
|
941 |
+
},
|
942 |
+
{
|
943 |
+
"id": 32101,
|
944 |
+
"content": "hello_enthusiastic_morning",
|
945 |
+
"single_word": false,
|
946 |
+
"lstrip": false,
|
947 |
+
"rstrip": false,
|
948 |
+
"normalized": true,
|
949 |
+
"special": false
|
950 |
}
|
951 |
],
|
952 |
"normalizer": {
|
|
|
968 |
"pre_tokenizer": {
|
969 |
"type": "Metaspace",
|
970 |
"replacement": "▁",
|
971 |
+
"add_prefix_space": true,
|
972 |
+
"prepend_scheme": "always"
|
973 |
},
|
974 |
"post_processor": {
|
975 |
"type": "TemplateProcessing",
|
|
|
1028 |
"decoder": {
|
1029 |
"type": "Metaspace",
|
1030 |
"replacement": "▁",
|
1031 |
+
"add_prefix_space": true,
|
1032 |
+
"prepend_scheme": "always"
|
1033 |
},
|
1034 |
"model": {
|
1035 |
"type": "Unigram",
|
|
|
129435 |
"<extra_id_0>",
|
129436 |
0.0
|
129437 |
]
|
129438 |
+
],
|
129439 |
+
"byte_fallback": false
|
129440 |
}
|
129441 |
}
|