NGHIA_Test_Edge_TTS_transcript_w_timestamp

Sleeping

App Files Files Community

cnph001 committed on Apr 27

Commit

5eeb00f

verified ·

1 Parent(s): cf1d09e

Update app.py

Browse files

Insert Silence.mp3 at each position where an "SSxxx" marker is found

Files changed (1) hide show

app.py +7 -10

app.py CHANGED Viewed

@@ -33,9 +33,12 @@ async def paragraph_to_speech(text, voice, rate, pitch):
     for part in parts:
         if re.match(r'SS\d+\.?\d*', part):
             try:
-                silence_duration = float(part[2:])
-                silence_durations.append(silence_duration)
-                audio_segments.append(None) # Placeholder for silence
             except ValueError:
                 print(f"Warning: Invalid silence duration format: {part}")
         elif part.strip():
@@ -43,7 +46,6 @@ async def paragraph_to_speech(text, voice, rate, pitch):
             current_voice = voice
             current_rate = rate
             current_pitch = pitch
             if part.startswith("1F"):
                 processed_text = part[2:]
                 current_voice = voice1F.split(" - ")[0]
@@ -121,11 +123,6 @@ async def text_to_speech(text, voice, rate, pitch):
                     os.remove(segment)  # Clean up individual files
                 except FileNotFoundError:
                     print(f"Warning: Audio file not found: {segment}")
-            elif isinstance(segment, (int, float)):
-                # Basic silence insertion (approximate)
-                silence = b'\x00' * int(segment * 44100 * 2) # Assuming 16-bit mono at 44.1kHz
-                outfile.write(silence)
     return combined_audio_path, None
 # Gradio interface function
@@ -142,7 +139,7 @@ async def create_demo():
     default_voice = "en-US-AndrewMultilingualNeural - en-US (Male)"  # 👈 Pick one of the available voices
     description = """
     Default = male, other voices 1F:US_Emma, 2F:US_Jenny, 3F:HK_Yan, 1M:AU_Will, 2M:IT_Guiseppe,3M:US_Brian,  1C: Childvoice, 1O = OldMan
-    You can insert silence using the marker 'SS' followed by the duration in seconds (e.g., 'SS1.2' for a 1.2-second pause).
     Enter your text, select a voice, and adjust the speech rate and pitch.
     The application will process your text paragraph by paragraph (separated by two blank lines).
     """

     for part in parts:
         if re.match(r'SS\d+\.?\d*', part):
             try:
+                #silence_duration = float(part[2:])
+                silence_path = os.path.join(os.path.dirname(__file__), "Silence.mp3")
+                if os.path.exists(silence_path):
+                     audio_segments.append(silence_path)
+                else:
+                     print(f"Warning: Silence.mp3 not found at {silence_path}")
             except ValueError:
                 print(f"Warning: Invalid silence duration format: {part}")
         elif part.strip():
             current_voice = voice
             current_rate = rate
             current_pitch = pitch
             if part.startswith("1F"):
                 processed_text = part[2:]
                 current_voice = voice1F.split(" - ")[0]
                     os.remove(segment)  # Clean up individual files
                 except FileNotFoundError:
                     print(f"Warning: Audio file not found: {segment}")
     return combined_audio_path, None
 # Gradio interface function
     default_voice = "en-US-AndrewMultilingualNeural - en-US (Male)"  # 👈 Pick one of the available voices
     description = """
     Default = male, other voices 1F:US_Emma, 2F:US_Jenny, 3F:HK_Yan, 1M:AU_Will, 2M:IT_Guiseppe,3M:US_Brian,  1C: Childvoice, 1O = OldMan
+    You can insert silence using the marker 'SS' (This will insert a Silence period from the Silence.mp3 file).
     Enter your text, select a voice, and adjust the speech rate and pitch.
     The application will process your text paragraph by paragraph (separated by two blank lines).
     """