Spaces: Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -137,6 +137,7 @@ def magnitude_to_complex_spectrogram(magnitude_spectrogram):
|
|
137 |
complex_spectrogram = torch.stack([magnitude_spectrogram, zero_phase], dim=-1)
|
138 |
return complex_spectrogram
|
139 |
|
|
|
140 |
def spectrogram_to_audio(magnitude_spectrogram):
|
141 |
# Perform inverse log scaling
|
142 |
magnitude_spectrogram = torch.expm1(magnitude_spectrogram)
|
@@ -150,7 +151,10 @@ def spectrogram_to_audio(magnitude_spectrogram):
|
|
150 |
# Normalize audio to the range [-1, 1] (standard audio range)
|
151 |
audio = audio / torch.max(torch.abs(audio))
|
152 |
|
153 |
-
#
|
|
|
|
|
|
|
154 |
audio = (audio * 32767).short()
|
155 |
|
156 |
return audio
|
|
|
137 |
complex_spectrogram = torch.stack([magnitude_spectrogram, zero_phase], dim=-1)
|
138 |
return complex_spectrogram
|
139 |
|
140 |
+
|
141 |
def spectrogram_to_audio(magnitude_spectrogram):
|
142 |
# Perform inverse log scaling
|
143 |
magnitude_spectrogram = torch.expm1(magnitude_spectrogram)
|
|
|
151 |
# Normalize audio to the range [-1, 1] (standard audio range)
|
152 |
audio = audio / torch.max(torch.abs(audio))
|
153 |
|
154 |
+
# Clip the audio to ensure it fits in the range [-1, 1]
|
155 |
+
audio = torch.clamp(audio, min=-1, max=1)
|
156 |
+
|
157 |
+
# Convert to 16-bit PCM format by scaling and casting
|
158 |
audio = (audio * 32767).short()
|
159 |
|
160 |
return audio
|