Update README.md
Browse files
README.md
CHANGED
@@ -32,8 +32,8 @@ tokenizer = Tokenizer.from_pretrained("fahadqazi/Sindhi-BPE-Tokenizer")
|
|
32 |
encoded = tokenizer.encode("ڪهڙا حال آهن")
|
33 |
decoded = tokenizer.decode(encoded.ids)
|
34 |
|
35 |
-
print("Encoded tokens: ", encoded.tokens)
|
36 |
-
print("Decoded text: ", decoded)
|
37 |
|
38 |
```
|
39 |
|
|
|
32 |
encoded = tokenizer.encode("ڪهڙا حال آهن")
|
33 |
decoded = tokenizer.decode(encoded.ids)
|
34 |
|
35 |
+
print("Encoded tokens:  ", encoded.tokens) # output (byte-level BPE symbols, not mojibake): ['Úª', 'Ùĩ', 'ÚĻØ§', 'ĠØŃØ§ÙĦ', 'ĠØ¢ÙĩÙĨ']
|
36 |
+
print("Decoded text: ", decoded) # output: ڪهڙا حال آهن
|
37 |
|
38 |
```
|
39 |
|