Spaces:

musdfakoc
/

local_intelligence

Sleeping

App Files Community

musdfakoc committed on Oct 17, 2024

Commit

7ce9286

verified ·

1 Parent(s): adf8868

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -6

app.py CHANGED Viewed

@@ -74,6 +74,13 @@ def save_spectrogram_image(spectrogram, name):
     plt.close()
     return temp_image_path
 # Process the input image and convert to audio
 def process_image(input_image):
     # Generate a unique name based on the current time
@@ -86,6 +93,9 @@ def process_image(input_image):
         pixels = expand_dims(pixels, 0)
         return pixels
     # Preprocess the input
     src_image = load_image(input_image)
@@ -113,27 +123,28 @@ def process_image(input_image):
     audio_file_path = f"{image_name}_generated_audio.wav"
     sf.write(audio_file_path, wav, samplerate=44100)
-    return spectrogram_image_path, audio_file_path  # Return the paths for both spectrogram image and audio
 # Gradio Interface
 def gradio_process_image(input_image):
-    spectrogram_image_path, audio_file_path = process_image(input_image)
     # After Gradio finishes using these files, delete them to avoid keeping them around
     def cleanup():
         os.remove(spectrogram_image_path)
         os.remove(audio_file_path)
-        print(f"Deleted temp files: {spectrogram_image_path}, {audio_file_path}")
-    return spectrogram_image_path, audio_file_path, cleanup
 # Create the Gradio interface
 interface = gr.Interface(
     fn=gradio_process_image,
     inputs=gr.Image(type="pil"),  # Input is an image
-    outputs=[gr.Image(type="filepath"), gr.Audio(type="filepath")],  # Output both spectrogram image and audio file
     title="Image to Audio Generator with Spectrogram Display",
-    description="Upload an image and get an audio file generated using Pix2Pix.",
 )
 # Launch the interface

     plt.close()
     return temp_image_path
+# Save the uploaded image with the same timestamp
+def save_uploaded_image(input_image, name):
+    # Save the uploaded image with the same unique timestamp name
+    uploaded_image_path = f"{name}_uploaded_image.png"
+    input_image.save(uploaded_image_path)
+    return uploaded_image_path
 # Process the input image and convert to audio
 def process_image(input_image):
     # Generate a unique name based on the current time
         pixels = expand_dims(pixels, 0)
         return pixels
+    # Save the uploaded image with the unique timestamp name
+    uploaded_image_path = save_uploaded_image(input_image, image_name)
     # Preprocess the input
     src_image = load_image(input_image)
     audio_file_path = f"{image_name}_generated_audio.wav"
     sf.write(audio_file_path, wav, samplerate=44100)
+    return uploaded_image_path, spectrogram_image_path, audio_file_path  # Return paths for uploaded image, spectrogram, and audio
 # Gradio Interface
 def gradio_process_image(input_image):
+    uploaded_image_path, spectrogram_image_path, audio_file_path = process_image(input_image)
     # After Gradio finishes using these files, delete them to avoid keeping them around
     def cleanup():
+        os.remove(uploaded_image_path)
         os.remove(spectrogram_image_path)
         os.remove(audio_file_path)
+        print(f"Deleted temp files: {uploaded_image_path}, {spectrogram_image_path}, {audio_file_path}")
+    return uploaded_image_path, spectrogram_image_path, audio_file_path, cleanup
 # Create the Gradio interface
 interface = gr.Interface(
     fn=gradio_process_image,
     inputs=gr.Image(type="pil"),  # Input is an image
+    outputs=[gr.File(label="Uploaded Image"), gr.Image(type="filepath"), gr.Audio(type="filepath")],  # Output uploaded image, spectrogram, and audio file
     title="Image to Audio Generator with Spectrogram Display",
+    description="Upload an image, and get an audio file generated using Pix2Pix.",
 )
 # Launch the interface