Spaces:
Running
Running
Commit
·
3a6f187
1
Parent(s):
7ef74ac
app.py
CHANGED
@@ -12,7 +12,9 @@ TOKENIZER_CUSTOM = {
|
|
12 |
"Google mT5": "google/mt5-base",
|
13 |
"Google mT5 Extended": "alakxender/mt5-dhivehi-tokenizer-extended",
|
14 |
"DeBERTa Extended": "alakxender/deberta-dhivehi-tokenizer-extended",
|
15 |
-
"XLM-RoBERTa Extended": "alakxender/xlmr-dhivehi-tokenizer-extended"
|
|
|
|
|
16 |
}
|
17 |
|
18 |
# Suggested stock model paths for the right input
|
@@ -26,7 +28,8 @@ SUGGESTED_STOCK_PATHS = [
|
|
26 |
"microsoft/trocr-base-printed",
|
27 |
"microsoft/deberta-v3-base"
|
28 |
"xlm-roberta-base",
|
29 |
-
"naver-clova-ix/donut-base"
|
|
|
30 |
]
|
31 |
|
32 |
# Cache for loaded tokenizers to avoid reloading
|
|
|
12 |
"Google mT5": "google/mt5-base",
|
13 |
"Google mT5 Extended": "alakxender/mt5-dhivehi-tokenizer-extended",
|
14 |
"DeBERTa Extended": "alakxender/deberta-dhivehi-tokenizer-extended",
|
15 |
+
"XLM-RoBERTa Extended": "alakxender/xlmr-dhivehi-tokenizer-extended",
|
16 |
+
"Bert Extended": "alakxender/bert-dhivehi-tokenizer-extended"
|
17 |
+
|
18 |
}
|
19 |
|
20 |
# Suggested stock model paths for the right input
|
|
|
28 |
"microsoft/trocr-base-printed",
|
29 |
"microsoft/deberta-v3-base"
|
30 |
"xlm-roberta-base",
|
31 |
+
"naver-clova-ix/donut-base",
|
32 |
+
"bert-base-multilingual-cased"
|
33 |
]
|
34 |
|
35 |
# Cache for loaded tokenizers to avoid reloading
|