Spaces:

Bils
/

AIPromoStudio

Running

App Files Community

Bils committed on Jan 12

Commit

60b6e41

verified ·

1 Parent(s): 0abc339

Update app.py

Browse files

Files changed (1) hide show

app.py +56 -16

app.py CHANGED Viewed

@@ -11,9 +11,8 @@ from transformers import (
 from scipy.io.wavfile import write
 import tempfile
 from dotenv import load_dotenv
-import spaces  # Assumes Hugging Face Spaces library supports `@spaces.GPU`
-# Load environment variables (e.g., Hugging Face token)
 load_dotenv()
 hf_token = os.getenv("HF_TOKEN")
@@ -21,7 +20,7 @@ hf_token = os.getenv("HF_TOKEN")
 # ---------------------------------------------------------------------
 # Load Llama 3 Pipeline with Zero GPU (Encapsulated)
 # ---------------------------------------------------------------------
-@spaces.GPU(duration=300)  # Adjust GPU allocation duration
 def generate_script(user_prompt: str, model_id: str, token: str):
     try:
         tokenizer = AutoTokenizer.from_pretrained(model_id, use_auth_token=token)
@@ -35,9 +34,10 @@ def generate_script(user_prompt: str, model_id: str, token: str):
         llama_pipeline = pipeline("text-generation", model=model, tokenizer=tokenizer)
         system_prompt = (
-            "You are a top-tier radio imaging producer using Llama 3. "
-            "Take the user's concept and craft a short, creative promo script."
-        )
         combined_prompt = f"{system_prompt}\nUser concept: {user_prompt}\nRefined script:"
         result = llama_pipeline(combined_prompt, max_new_tokens=200, do_sample=True, temperature=0.9)
         return result[0]["generated_text"].split("Refined script:")[-1].strip()
@@ -85,23 +85,63 @@ def interface_generate_audio(script, audio_length):
 # Interface
 # ---------------------------------------------------------------------
 with gr.Blocks() as demo:
-    gr.Markdown("# 🎧 AI Radio Imaging with Llama 3 + MusicGen (Zero GPU)")
     with gr.Row():
         user_prompt = gr.Textbox(
-            label="Enter your promo idea",
-            placeholder="E.g., A 15-second hype jingle for a morning talk show.",
         )
         llama_model_id = gr.Textbox(
-            label="Llama 3 Model ID", value="meta-llama/Meta-Llama-3-8B-Instruct"
         )
-        audio_length = gr.Slider(label="Audio Length (tokens)", minimum=128, maximum=1024, step=64, value=512)
-    generate_script_button = gr.Button("Generate Script")
-    script_output = gr.Textbox(label="Generated Script")
-    generate_audio_button = gr.Button("Generate Audio")
-    audio_output = gr.Audio(label="Generated Audio", type="filepath")
     generate_script_button.click(
         fn=interface_generate_script,
         inputs=[user_prompt, llama_model_id],

 from scipy.io.wavfile import write
 import tempfile
 from dotenv import load_dotenv
+import spaces
 load_dotenv()
 hf_token = os.getenv("HF_TOKEN")
 # ---------------------------------------------------------------------
 # Load Llama 3 Pipeline with Zero GPU (Encapsulated)
 # ---------------------------------------------------------------------
+@spaces.GPU(duration=300)
 def generate_script(user_prompt: str, model_id: str, token: str):
     try:
         tokenizer = AutoTokenizer.from_pretrained(model_id, use_auth_token=token)
         llama_pipeline = pipeline("text-generation", model=model, tokenizer=tokenizer)
         system_prompt = (
+    "You are an expert radio imaging producer specializing in sound design and music. "
+    "Take the user's concept and craft a concise, creative promo script with a strong focus on auditory elements and musical appeal."
+)
         combined_prompt = f"{system_prompt}\nUser concept: {user_prompt}\nRefined script:"
         result = llama_pipeline(combined_prompt, max_new_tokens=200, do_sample=True, temperature=0.9)
         return result[0]["generated_text"].split("Refined script:")[-1].strip()
 # Interface
 # ---------------------------------------------------------------------
 with gr.Blocks() as demo:
+    # Header
+    gr.Markdown("""
+        # 🎙️ AI-Powered Radio Imaging Studio 🚀
+        ### Create stunning **radio promos** with **Llama 3** and **MusicGen**
+        🔥 **Zero GPU** integration for efficiency and ease!
+    """)
+    # Script Generation Section
+    gr.Markdown("## ✍️ Step 1: Generate Your Promo Script")
     with gr.Row():
         user_prompt = gr.Textbox(
+            label="🎤 Enter Promo Idea",
+            placeholder="E.g., A 15-second energetic jingle for a morning talk show.",
+            lines=2,
+            info="Describe your promo idea clearly to generate a creative script."
         )
         llama_model_id = gr.Textbox(
+            label="🎛️ Llama 3 Model ID",
+            value="meta-llama/Meta-Llama-3-8B-Instruct",
+            info="Enter the Hugging Face model ID for Llama 3."
         )
+    generate_script_button = gr.Button("Generate Script ✨")
+    script_output = gr.Textbox(
+        label="📜 Generated Promo Script",
+        lines=4,
+        interactive=False,
+        info="Your generated promo script will appear here."
+    )
+    # Audio Generation Section
+    gr.Markdown("## 🎧 Step 2: Generate Audio from Your Script")
+    with gr.Row():
+        audio_length = gr.Slider(
+            label="🎵 Audio Length (tokens)",
+            minimum=128,
+            maximum=1024,
+            step=64,
+            value=512,
+            info="Select the desired audio token length."
+        )
+    generate_audio_button = gr.Button("Generate Audio 🎶")
+    audio_output = gr.Audio(
+        label="🎶 Generated Audio File",
+        type="filepath",
+        interactive=False,
+        info="Listen to the audio file generated from your script."
+    )
+    # Footer
+    gr.Markdown("""
+        <br><hr>
+        <p style="text-align: center; font-size: 0.9em;">
+            Created with ❤️ by <a href="https://bilsimaging.com" target="_blank">bilsimaging.com</a>
+        </p>
+    """, elem_id="footer")
+    # Button Actions
     generate_script_button.click(
         fn=interface_generate_script,
         inputs=[user_prompt, llama_model_id],