Spaces:

bobpopboom
/

chaty

Sleeping

hashhac committed on Mar 15

Commit

3931f99

1 Parent(s): 58bcff1

no more int16

Files changed (1) hide show

app.py CHANGED Viewed

@@ -101,13 +101,11 @@ def text_to_speech(text):
         )
     # Convert to numpy array
-    # Make sure speech is float32 before any conversion to avoid the error
     audio_array = speech.cpu().numpy().astype(np.float32)
-    # Normalize and convert to int16 for output
-    audio_array = (audio_array / np.max(np.abs(audio_array) + 1e-6) * 32767).astype(np.int16)
-    # Reshape for fastrtc
     audio_array = audio_array.reshape(1, -1).astype(np.float32)
     return (16000, audio_array)  # SpeechT5 uses 16kHz sample rate

         )
     # Convert to numpy array
     audio_array = speech.cpu().numpy().astype(np.float32)
+    # Normalize the audio
+    audio_array = audio_array / np.max(np.abs(audio_array) + 1e-6)
     audio_array = audio_array.reshape(1, -1).astype(np.float32)
     return (16000, audio_array)  # SpeechT5 uses 16kHz sample rate