Spaces:

sudhanm
/

whisper-largev2-raw-ta-ml

Sleeping

App Files Community

sudhanm committed 15 days ago

Commit

5618139

verified ·

1 Parent(s): 2798eed

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -10

app.py CHANGED Viewed

@@ -15,12 +15,28 @@ LANG_CODES = {
     "Sanskrit": "sa"
 }
 LANG_PRIMERS = {
-    "English": ("", ""),
-    "Tamil": ("The transcript should be in Tamil script.", "Write only in Tamil script without translation."),
-    "Malayalam": ("The transcript should be in Malayalam script.", "Write only in Malayalam script without translation."),
-    "Hindi": ("The transcript should be in Devanagari script.", "Write only in Devanagari script without translation."),
-    "Sanskrit": ("The transcript should be in Devanagari script.", "Write only in Devanagari script without translation.")
 }
 # Script detection regexes
@@ -77,17 +93,17 @@ def transcribe(audio, language_choice):
     lang_code = LANG_CODES[language_choice]
     primer_weak, primer_strong = LANG_PRIMERS[language_choice]
-    # Pass 1: loose mode to get context
     loose_text = transcribe_once(
         audio_path=audio,
         lang_code=lang_code,
-        initial_prompt="",
         beam_size=8,
         temperature=0.4,
         condition_on_previous_text=True
     )
-    # Pass 2: strict mode with context
     strict_prompt = f"{primer_strong}\nContext: {loose_text}"
     strict_text = transcribe_once(
         audio_path=audio,
@@ -98,7 +114,7 @@ def transcribe(audio, language_choice):
         condition_on_previous_text=False
     )
-    # Check script match — if wrong, retry without context, only strict primer
     if not is_script(strict_text, language_choice):
         strict_text = transcribe_once(
             audio_path=audio,
@@ -109,7 +125,7 @@ def transcribe(audio, language_choice):
             condition_on_previous_text=False
         )
-    # Final check before transliteration
     if is_script(strict_text, language_choice):
         hk_translit = transliterate_to_hk(strict_text, language_choice)
     else:

     "Sanskrit": "sa"
 }
+# Stronger primers in native script with example sentences
 LANG_PRIMERS = {
+    "English": (
+        "The transcript should be in English only.",
+        "Write only in English without translation. Example: This is an English sentence."
+    ),
+    "Tamil": (
+        "நகல் தமிழ் எழுத்துக்களில் மட்டும் இருக்க வேண்டும்.",
+        "தமிழ் எழுத்துக்களில் மட்டும் எழுதவும், மொழிபெயர்ப்பு செய்யக்கூடாது. உதாரணம்: இது ஒரு தமிழ் வாக்கியம்."
+    ),
+    "Malayalam": (
+        "ട്രാൻസ്ക്രിപ്റ്റ് മലയാള ലിപിയിൽ ആയിരിക്കണം.",
+        "മലയാള ലിപിയിൽ മാത്രം എഴുതുക, വിവർത്തനം ചെയ്യരുത്. ഉദാഹരണം: ഇതൊരു മലയാള വാക്യമാണ്. എനിക്ക് മലയാളം അറിയാം."
+    ),
+    "Hindi": (
+        "प्रतिलिपि केवल देवनागरी लिपि में होनी चाहिए।",
+        "केवल देवनागरी लिपि में लिखें, अनुवाद न करें। उदाहरण: यह एक हिंदी वाक्य है।"
+    ),
+    "Sanskrit": (
+        "प्रतिलिपि केवल देवनागरी लिपि में होनी चाहिए।",
+        "केवल देवनागरी लिपि में लिखें, अनुवाद न करें। उदाहरण: अहं संस्कृतं जानामि।"
+    )
 }
 # Script detection regexes
     lang_code = LANG_CODES[language_choice]
     primer_weak, primer_strong = LANG_PRIMERS[language_choice]
+    # Pass 1: loose mode to get context (optional weak primer for bias)
     loose_text = transcribe_once(
         audio_path=audio,
         lang_code=lang_code,
+        initial_prompt=primer_weak,  # <-- Weak primer used here too
         beam_size=8,
         temperature=0.4,
         condition_on_previous_text=True
     )
+    # Pass 2: strict mode with strong primer + context
     strict_prompt = f"{primer_strong}\nContext: {loose_text}"
     strict_text = transcribe_once(
         audio_path=audio,
         condition_on_previous_text=False
     )
+    # Check script match — if wrong, retry without context, only strong primer
     if not is_script(strict_text, language_choice):
         strict_text = transcribe_once(
             audio_path=audio,
             condition_on_previous_text=False
         )
+    # Transliteration
     if is_script(strict_text, language_choice):
         hk_translit = transliterate_to_hk(strict_text, language_choice)
     else: