Spaces:

Agents-MCP-Hackathon
/

Audio-Agent

Sleeping

App Files Files Community

YigitSekerci committed on Jun 9

Commit

9afb0c3

1 Parent(s): 5720b20

add guidelines

Browse files

Files changed (1) hide show

src/ui.py +37 -3

src/ui.py CHANGED Viewed

@@ -129,8 +129,8 @@ def create_interface():
         theme=gr.themes.Default(),
     ) as interface:
         gr.Markdown("""
-        # 🎵 Audio Agent - Professional Audio Processing
-        **Supported formats**: MP3, WAV, M4A, FLAC, AAC, OGG
         """)
         # Hidden state to store audio file URLs and custom history
@@ -227,7 +227,41 @@ def create_interface():
             [chatbot, audio_urls_state, custom_history_state],
             [chatbot, output_audio_files, custom_history_state]
         )
     return interface
 if __name__ == "__main__":

         theme=gr.themes.Default(),
     ) as interface:
         gr.Markdown("""
+        # Audio Agent - Your AI Audio Assistant
+        Upload your audio files and tell me what you need. I'll handle the rest!
         """)
         # Hidden state to store audio file URLs and custom history
             [chatbot, audio_urls_state, custom_history_state],
             [chatbot, output_audio_files, custom_history_state]
         )
+        gr.Markdown("""
+        ---
+        """)
+        with gr.Row():
+            gr.Markdown("""
+            ## 🎚️ What I Can Do For You
+            **Audio Manipulation:**
+            - Merge multiple audio files into one continuous track
+            - Cut or trim specific sections from any file
+            - Adjust volume levels (increase or decrease)
+            - Normalize audio levels for consistency
+            - Apply fade-in or fade-out effects for smooth transitions (Mono channel only)
+            - Change playback speed (faster or slower, with pitch change)
+            - Reverse audio for creative effects
+            - Remove silence from beginning or end of files
+            **Analysis & Transcription:** (English only)
+            - Transcribe speech in audio to text
+            - Analyze audio properties (duration, sample rate, etc.)
+            """)
+            gr.Markdown("""
+            ## 💡 Example Requests
+            - *"Merge these two audio files and add a fade-in effect"*
+            - *"Remove the silence at the beginning of this recording"*
+            - *"Transcribe the speech in this audio file"*
+            - *"Increase the volume of the first track and normalize both files"*
+            - *"Cut out the middle section from 1:30 to 2:45"*
+            - *"Make this audio play 1.5x faster"*
+            - *"Apply a fade-out effect to the end of this track"*
+            """)
     return interface
 if __name__ == "__main__":