NGHIA_Test_Edge_TTS_transcript_w_timestamp

Sleeping

cnph001 committed on May 7

Commit

85b246d

verified ·

1 Parent(s): 3a7ede0

Update app.py

Fix compression: only time-stretch the generated audio when it is longer than the target duration.

Files changed (1) hide show

app.py CHANGED Viewed

@@ -101,13 +101,18 @@ async def generate_audio_with_voice_prefix(text_segment, default_voice, rate, pi
         if target_duration_ms is not None and os.path.exists(audio_path):
             audio = AudioSegment.from_mp3(audio_path)
             audio_duration_ms = len(audio)
-            if audio_duration_ms > 0 and target_duration_ms > 0:
                 speed_factor = audio_duration_ms / target_duration_ms
                 if speed_factor > 0:
-                    # Use librosa for time stretching with better quality for speech
                     y, sr = librosa.load(audio_path, sr=None)
                     y_stretched = librosa.effects.time_stretch(y, rate=speed_factor)
                     sf.write(audio_path, y_stretched, sr)
         return audio_path
     return None
@@ -251,4 +256,4 @@ async def create_demo():
 if __name__ == "__main__":
     import soundfile as sf # Import soundfile here
     demo = asyncio.run(create_demo())
-    demo.launch()

         if target_duration_ms is not None and os.path.exists(audio_path):
             audio = AudioSegment.from_mp3(audio_path)
             audio_duration_ms = len(audio)
+            print(f"Generated audio duration: {audio_duration_ms}ms, Target duration: {target_duration_ms}ms") # Debug
+            if audio_duration_ms > target_duration_ms and target_duration_ms > 0:
                 speed_factor = audio_duration_ms / target_duration_ms
+                print(f"Speed factor (to reduce duration): {speed_factor}") # Debug
                 if speed_factor > 0:
                     y, sr = librosa.load(audio_path, sr=None)
                     y_stretched = librosa.effects.time_stretch(y, rate=speed_factor)
                     sf.write(audio_path, y_stretched, sr)
+            else:
+                print("Generated audio is not longer than target duration, no speed adjustment.") # Debug
         return audio_path
     return None
 if __name__ == "__main__":
     import soundfile as sf # Import soundfile here
     demo = asyncio.run(create_demo())
+    demo.launch()