add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
|
|
1 |
+
{"ش": 0, "آ": 1, "ج": 2, "ڑ": 3, "س": 4, "ِ": 5, "ض": 6, "ط": 7, "": 8, "گ": 9, "خ": 10, "ن": 11, "د": 12, "پ": 13, "ا": 14, "ں": 15, "ذ": 16, "ُ": 17, "ؤ": 18, "ل": 19, "ہ": 20, "ص": 21, "غ": 22, "َ": 23, "و": 24, "ع": 25, "ر": 26, "ھ": 27, "ق": 28, "ب": 29, "ث": 30, "ح": 31, "ٹ": 32, "ز": 33, "چ": 34, "ت": 35, "ء": 36, "ژ": 37, "ظ": 38, "ٔ": 39, "ئ": 40, "ً": 41, "ی": 42, "ے": 43, "ف": 44, "ک": 46, "ّ": 47, "م": 48, "ڈ": 49, "|": 45, "[UNK]": 50, "[PAD]": 51}
|