Spaces:

nvidia
/

audio-flamingo-3

Running on A100

App Files Files Community

SreyanG-NVIDIA committed 2 days ago

Commit

8ba4304

verified ·

1 Parent(s): cffa0cb

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -5

app.py CHANGED Viewed

@@ -153,7 +153,7 @@ with gr.Blocks(css="""
             with gr.Row():
                 with gr.Column():
                     audio_input_single = gr.Audio(type="filepath", label="Upload Audio")
-                    prompt_input_single = gr.Textbox(label="Prompt", placeholder="Ask a question about the audio...")
                     btn_single = gr.Button("Generate Answer")
                     gr.Examples(
@@ -170,12 +170,12 @@ with gr.Blocks(css="""
                     output_single = gr.Textbox(label="Model Response", lines=8)
             btn_single.click(fn=single_turn_infer, inputs=[audio_input_single, prompt_input_single], outputs=output_single)
-        with gr.Tab("🤔 AF-Think"):
             with gr.Row():
                 with gr.Column():
                     audio_input_think = gr.Audio(type="filepath", label="Upload Audio")
-                    prompt_input_think = gr.Textbox(label="Prompt", placeholder="Ask a question about the audio...")
                     btn_think = gr.Button("Generate Answer")
                     gr.Examples(
@@ -183,7 +183,7 @@ with gr.Blocks(css="""
                             ["static/think/audio1.wav", "What are the two people doing in the audio Choose the correct option from the following options:\n(A) One person is demonstrating how to use the equipment\n(B) The two people are discussing how to use the equipment\n(C) The two people are disassembling the equipment\n(D) One person is teaching another person how to use a piece of equipment\nPlease think and reason about the input audio before you respond."],
                             ["static/think/audio2.wav", "Is the boat in the video moving closer or further away? Choose the correct option from the following options:\n(A) Closer\n(B) Further\nPlease think and reason about the input audio before you respond."],
                         ],
-                        inputs=[audio_input_think, prompt_input_think],
                         label="🧪 Try Examples"
                     )
@@ -195,7 +195,7 @@ with gr.Blocks(css="""
         with gr.Tab("💬 Multi-Turn Chat"):
             chatbot = gr.Chatbot(label="Audio Chatbot")
             audio_input_multi = gr.Audio(type="filepath", label="Upload or Replace Audio Context")
-            user_input_multi = gr.Textbox(label="Your message", placeholder="Ask a question about the audio...")
             btn_multi = gr.Button("Send")
             history_state = gr.State([])           # Chat history
             current_audio_state = gr.State(None)   # Most recent audio file path

             with gr.Row():
                 with gr.Column():
                     audio_input_single = gr.Audio(type="filepath", label="Upload Audio")
+                    prompt_input_single = gr.Textbox(label="Prompt", placeholder="Ask a question about the audio...", lines=8)
                     btn_single = gr.Button("Generate Answer")
                     gr.Examples(
                     output_single = gr.Textbox(label="Model Response", lines=8)
             btn_single.click(fn=single_turn_infer, inputs=[audio_input_single, prompt_input_single], outputs=output_single)
+        with gr.Tab("🤔 Think / Long"):
             with gr.Row():
                 with gr.Column():
                     audio_input_think = gr.Audio(type="filepath", label="Upload Audio")
+                    prompt_input_think = gr.Textbox(label="Prompt", placeholder="Ask a question about the audio...", lines=8)
                     btn_think = gr.Button("Generate Answer")
                     gr.Examples(
                             ["static/think/audio1.wav", "What are the two people doing in the audio Choose the correct option from the following options:\n(A) One person is demonstrating how to use the equipment\n(B) The two people are discussing how to use the equipment\n(C) The two people are disassembling the equipment\n(D) One person is teaching another person how to use a piece of equipment\nPlease think and reason about the input audio before you respond."],
                             ["static/think/audio2.wav", "Is the boat in the video moving closer or further away? Choose the correct option from the following options:\n(A) Closer\n(B) Further\nPlease think and reason about the input audio before you respond."],
                         ],
+                        inputs=[audio_input_think, prompt_input_think+"\nPlease think and reason about the input music before you respond."],
                         label="🧪 Try Examples"
                     )
         with gr.Tab("💬 Multi-Turn Chat"):
             chatbot = gr.Chatbot(label="Audio Chatbot")
             audio_input_multi = gr.Audio(type="filepath", label="Upload or Replace Audio Context")
+            user_input_multi = gr.Textbox(label="Your message", placeholder="Ask a question about the audio...", lines=8)
             btn_multi = gr.Button("Send")
             history_state = gr.State([])           # Chat history
             current_audio_state = gr.State(None)   # Most recent audio file path