musdfakoc committed on
Commit
2efb66f
·
verified ·
1 Parent(s): fbb8eef

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -1
app.py CHANGED
@@ -137,6 +137,7 @@ def magnitude_to_complex_spectrogram(magnitude_spectrogram):
137
  complex_spectrogram = torch.stack([magnitude_spectrogram, zero_phase], dim=-1)
138
  return complex_spectrogram
139
 
 
140
  def spectrogram_to_audio(magnitude_spectrogram):
141
  # Perform inverse log scaling
142
  magnitude_spectrogram = torch.expm1(magnitude_spectrogram)
@@ -150,7 +151,10 @@ def spectrogram_to_audio(magnitude_spectrogram):
150
  # Normalize audio to the range [-1, 1] (standard audio range)
151
  audio = audio / torch.max(torch.abs(audio))
152
 
153
- # Convert audio to 16-bit integer format, as expected for WAV files
 
 
 
154
  audio = (audio * 32767).short()
155
 
156
  return audio
 
137
  complex_spectrogram = torch.stack([magnitude_spectrogram, zero_phase], dim=-1)
138
  return complex_spectrogram
139
 
140
+
141
  def spectrogram_to_audio(magnitude_spectrogram):
142
  # Perform inverse log scaling
143
  magnitude_spectrogram = torch.expm1(magnitude_spectrogram)
 
151
  # Normalize audio to the range [-1, 1] (standard audio range)
152
  audio = audio / torch.max(torch.abs(audio))
153
 
154
+ # Clip the audio to ensure it fits in the range [-1, 1]
155
+ audio = torch.clamp(audio, min=-1, max=1)
156
+
157
+ # Convert to 16-bit PCM format by scaling and casting
158
  audio = (audio * 32767).short()
159
 
160
  return audio