Spaces:

ziqiangao
/

surroundify

Sleeping

App Files Files Community

ziqiangao committed 19 days ago

Commit

62ee3db

1 Parent(s): a310a15

try it on here

Browse files

Files changed (1) hide show

app.py +72 -4

app.py CHANGED Viewed

@@ -1,7 +1,75 @@
 import gradio as gr
-def greet(name):
-    return "Hello " + name + "!!"
-demo = gr.Interface(fn=greet, inputs="text", outputs="text")
-demo.launch()

 import gradio as gr
+import numpy as np
+import soundfile as sf
+from scipy import signal
+def extract_phantom_center_test(input_file, output_format, rdf=0.99999):
+    """Split a stereo file into a phantom-center track and a residual track.
+
+    For every STFT bin the center estimate combines the smaller of the
+    left/right magnitudes with the phase of the mono downmix. That estimate,
+    scaled by ``rdf``, is subtracted from each channel to form the residual
+    ("other") signal. Both results are written as two-channel files.
+
+    Args:
+        input_file: Path of the audio file to read; it must decode to exactly
+            two channels.
+        output_format: Extension used for the written files, e.g. "flac" or
+            "wav".
+        rdf: Reduction factor applied to the center estimate before it is
+            subtracted from the left and right channels.
+
+    Returns:
+        A tuple ``(other_path, center_path)`` with the paths of the residual
+        file and the center file.
+
+    Raises:
+        ValueError: If no input path is given, the audio is not stereo, or
+            the audio contains no samples.
+    """
+    import os
+    import tempfile
+    if not input_file:
+        raise ValueError("No input file provided")
+    data, samplerate = sf.read(input_file)
+    if data.ndim != 2 or data.shape[1] != 2:
+        raise ValueError("A stereo file is required (2 channels)")
+    n_samples = data.shape[0]
+    if n_samples == 0:
+        raise ValueError("The audio file contains no samples")
+    left = data[:, 0]
+    right = data[:, 1]
+    mono = np.mean(data, axis=1)
+    # One-second windows with 50% overlap. The window is clamped to the clip
+    # length: scipy shrinks an oversized nperseg inside stft, which would
+    # leave noverlap and the later istft calls using mismatched sizes.
+    nperseg = min(int(samplerate), n_samples)
+    noverlap = nperseg // 2
+    stft_args = dict(fs=samplerate, nperseg=nperseg, noverlap=noverlap)
+    _, _, Z_left = signal.stft(left, **stft_args)
+    _, _, Z_right = signal.stft(right, **stft_args)
+    _, _, Z_mono = signal.stft(mono, **stft_args)
+    # The center estimate is the same for both channels, so it is computed
+    # (and inverted) once and reused.
+    Z_common = np.minimum(np.abs(Z_left), np.abs(Z_right)) * np.exp(1j * np.angle(Z_mono))
+    Z_new_left = Z_left - Z_common * rdf
+    Z_new_right = Z_right - Z_common * rdf
+    _, new_left = signal.istft(Z_new_left, **stft_args)
+    _, new_right = signal.istft(Z_new_right, **stft_args)
+    _, common_signal = signal.istft(Z_common, **stft_args)
+    # istft output can be longer than the input; trim to the original length.
+    new_left = new_left[:n_samples]
+    new_right = new_right[:n_samples]
+    common_signal = common_signal[:n_samples]
+    # Scale the residual down only when it would exceed full scale.
+    peak = max(np.max(np.abs(new_left)), np.max(np.abs(new_right)))
+    if peak > 1.0:
+        new_left /= peak
+        new_right /= peak
+    # Each call writes into its own temporary directory so simultaneous
+    # requests cannot overwrite one another's "other"/"center" files.
+    out_dir = tempfile.mkdtemp(prefix="surroundify_")
+    output_file = os.path.join(out_dir, f"other.{output_format}")
+    output_center_file = os.path.join(out_dir, f"center.{output_format}")
+    sf.write(output_file, np.column_stack((new_left, new_right)), samplerate)
+    sf.write(output_center_file, np.column_stack((common_signal, common_signal)), samplerate)
+    return output_file, output_center_file
+# Gradio front end: one upload widget, two settings, and a button that runs
+# extract_phantom_center_test and shows both resulting files side by side.
+with gr.Blocks(title="Phantom Center Extraction", theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# Phantom Center Extraction")
+    input_audio = gr.Audio(type="filepath", label="Upload stereo audio")
+    # The slider covers 0.1 to 1.0 in steps of 0.00001 and starts at 0.99999.
+    reduction_f = gr.Slider(
+        minimum=0.1,
+        maximum=1.0,
+        value=0.99999,
+        step=0.00001,
+        label="Reduction Factor (rdf)",
+        interactive=True,
+    )
+    output_format = gr.Dropdown(
+        choices=["flac", "wav"],
+        value="flac",
+        label="Export format",
+    )
+    extract_btn = gr.Button("Separate")
+    with gr.Row():
+        side_audio = gr.Audio(type="filepath", label="Other audio", interactive=False)
+        center_audio = gr.Audio(type="filepath", label="Phantom center audio", interactive=False)
+    # The input order must match the function's parameters:
+    # (input_file, output_format, rdf).
+    extract_btn.click(
+        extract_phantom_center_test,
+        [input_audio, output_format, reduction_f],
+        [side_audio, center_audio],
+    )
+# Start the server only when run as a script; 0.0.0.0 listens on all
+# network interfaces rather than only localhost.
+if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0")