Spaces:

Athspi
/

Ai-audio

Running

Athspi committed on Jan 12

Commit

700dfd4

verified ·

1 Parent(s): 13b616e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -219,6 +219,10 @@ def detect_voice_activity(audio_file, threshold=0.02):
     # Load the WAV file
     sample_rate, data = wavfile.read(wav_path)
     # Normalize the audio data
     if data.dtype != np.float32:
         data = data.astype(np.float32) / np.iinfo(data.dtype).max

     # Load the WAV file
     sample_rate, data = wavfile.read(wav_path)
+    # If the audio is stereo, convert it to mono by averaging the channels
+    if len(data.shape) > 1:
+        data = np.mean(data, axis=1)
     # Normalize the audio data
     if data.dtype != np.float32:
         data = data.astype(np.float32) / np.iinfo(data.dtype).max