Spaces:

musdfakoc
/

local_intelligence

Sleeping

musdfakoc committed on Sep 29, 2024

Commit

99dc7e5

verified ·

1 Parent(s): eaee834

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -164,8 +164,12 @@ def spectrogram_to_audio(magnitude_spectrogram):
     return audio
-# Function to generate audio from an uploaded image
 def generate_audio_from_image(image):
     test_img = image_transform(image).unsqueeze(0).to(device)  # Preprocess image
     # Generate sound spectrogram from the image using the loaded generator
@@ -178,6 +182,7 @@ def generate_audio_from_image(image):
     # Convert audio tensor to numpy and return it for Gradio to handle
     return generated_audio.numpy(), sample_rate
 # Gradio Interface
 def main():
     global generator  # Declare the generator object globally
@@ -190,8 +195,9 @@ def main():
     # Gradio interface: allow users to upload an image and generate audio
     iface = gr.Interface(fn=generate_audio_from_image,
-                         inputs=gr.Image(type="pil"),
-                         outputs=gr.Audio(type="numpy", label="Generated Audio"))
     iface.launch()

     return audio
 def generate_audio_from_image(image):
+    if image is None:
+        raise ValueError("The uploaded image is 'None'. Please check the Gradio input.")
+    # Ensure the image is in the right format
+    print(f"Image received: {type(image)}")  # Debugging: Check if image is received
     test_img = image_transform(image).unsqueeze(0).to(device)  # Preprocess image
     # Generate sound spectrogram from the image using the loaded generator
     # Convert audio tensor to numpy and return it for Gradio to handle
     return generated_audio.numpy(), sample_rate
 # Gradio Interface
 def main():
     global generator  # Declare the generator object globally
     # Gradio interface: allow users to upload an image and generate audio
     iface = gr.Interface(fn=generate_audio_from_image,
+                     inputs=gr.Image(type="pil"),  # PIL type image
+                     outputs=gr.Audio(type="numpy", label="Generated Audio"))
     iface.launch()