add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"
|
|
|
|
| 1 |
+
{"ب": 0, "ظ": 1, "ژ": 2, "ص": 3, "َ": 4, "ط": 5, "ل": 6, "ّ": 7, "ف": 8, "": 9, "گ": 10, "ا": 11, "چ": 12, "ء": 13, "ہ": 15, "د": 16, "ُ": 17, "ٔ": 18, "ق": 19, "م": 20, "ذ": 21, "ھ": 22, "ن": 23, "ڑ": 24, "ٹ": 25, "ع": 26, "ت": 27, "ئ": 28, "خ": 29, "ض": 30, "پ": 31, "ً": 32, "ر": 33, "ش": 34, "ک": 35, "آ": 36, "ڈ": 37, "ی": 38, "و": 39, "س": 40, "ے": 41, "ج": 42, "ح": 43, "غ": 44, "ؤ": 45, "ز": 46, "ِ": 47, "ث": 48, "ں": 49, "|": 14, "[UNK]": 50, "[PAD]": 51}
|