Spaces:

mroccuper
/

Describer-Pro

Sleeping

App Files Files Community

mroccuper commited on May 6

Commit

70ebe1c

verified ·

1 Parent(s): 43c4d6f

Update app.py

Browse files

Files changed (1) hide show

app.py +86 -45

app.py CHANGED Viewed

@@ -10,7 +10,7 @@ from PIL import Image, ImageEnhance, ImageFilter
 # --- Environment Configuration ---
 GEMINI_KEY = os.environ.get("GEMINI_KEY", "")
 DEFAULT_PORT = int(os.environ.get("PORT", 7860))
-API_TIMEOUT = 120  # seconds
 # --- Style Template Optimization ---
 BASE_TEMPLATE = """Describe this design as a concise Flux 1.1 Pro prompt focusing on:
@@ -51,36 +51,39 @@ def preprocess_image(img):
 # --- Core Generation Engine ---
 def generate_prompt(image, api_key, style, creativity, neg_prompt, aspect, color_mode, dpi):
     try:
         if not image:
-            return {"error": "❌ Please upload an image"}
         api_key = api_key or GEMINI_KEY
         if not api_key:
-            return {"error": "❌ API key required - set GEMINI_KEY environment variable or use input field"}
-        # Lazy import for Gemini
         try:
             import google.generativeai as genai
             genai.configure(api_key=api_key)
             model = genai.GenerativeModel("gemini-1.5-pro")
         except ImportError:
-            return {"error": "❌ Install Gemini SDK: pip install google-generativeai"}
         except Exception as e:
             if "authentication" in str(e).lower():
-                return {"error": "❌ Invalid API key or authentication error"}
-            return {"error": f"❌ API initialization error: {str(e)}"}
-        # Image processing
         img = preprocess_image(image)
         img_bytes = io.BytesIO()
         img.save(img_bytes, format="PNG")
         img_b64 = base64.b64encode(img_bytes.getvalue()).decode()
-        # Prompt instruction
         instruction = f"{STYLE_INSTRUCTIONS[style]}\nAVOID: {neg_prompt}\n"
         instruction += f"ASPECT: {aspect}, COLORS: {color_mode}, DPI: {dpi}\n"
-        # Gemini generation
         try:
             response = model.generate_content(
                 contents=[instruction, {"mime_type": "image/png", "data": img_b64}],
@@ -88,41 +91,45 @@ def generate_prompt(image, api_key, style, creativity, neg_prompt, aspect, color
             )
             raw_prompt = response.text
         except Exception as e:
-            return {"error": f"❌ Prompt generation failed: {str(e)}"}
-        # Basic validation
         validation = {"score": 8, "issues": [], "suggestions": []}
-        input_tokens = len(img_b64) // 4  # Approximate
         output_tokens = len(raw_prompt.split())
-        return raw_prompt, validation, {
-            "input": input_tokens,
-            "output": output_tokens
         }
     except Exception as e:
         traceback.print_exc()
         return {"error": str(e)}
-# --- Response Formatter ---
 def format_generation_response(result):
     """Format the response from generate_prompt for the UI"""
     if "error" in result:
-        return result["error"], {}, {}
     else:
         return result.get("prompt", ""), result.get("validation", {}), result.get("stats", {})
-def update_status(result):
-    return "✅ Prompt generated successfully!" if "prompt" in result else result.get("error", "❌ Unknown error")
 # --- Main Interface ---
 def build_interface():
-    with gr.Blocks(title="Flux Pro Generator") as app:
         # Header
         gr.Markdown("# 🎨 Flux Pro Prompt Generator")
         gr.Markdown("Generate optimized design prompts from images using Google's Gemini")
-        # API Key
         api_key = gr.Textbox(
             label="🔑 Gemini API Key",
             value=GEMINI_KEY,
@@ -130,42 +137,76 @@ def build_interface():
             info="Set GEMINI_KEY environment variable for production"
         )
-        # Inputs
         with gr.Row():
             with gr.Column(scale=1):
-                img_input = gr.Image(label="🖼️ Upload Design", type="pil", sources=["upload"], interactive=True)
-                style = gr.Dropdown(list(STYLE_INSTRUCTIONS.keys()), value="General", label="🎨 Target Style")
                 with gr.Accordion("⚙️ Advanced Settings", open=False):
-                    creativity = gr.Slider(0.0, 1.0, value=0.7, step=0.05, label="Creativity Level")
                     neg_prompt = gr.Textbox(label="🚫 Negative Prompts", placeholder="What to avoid")
                     aspect = gr.Dropdown(FLUX_SPECS["aspect_ratios"], value="1:1", label="Aspect Ratio")
                     color_mode = gr.Dropdown(FLUX_SPECS["color_modes"], value="RGB", label="Color Mode")
                     dpi = gr.Dropdown([str(d) for d in FLUX_SPECS["dpi_options"]], value="300", label="Output DPI")
                 gen_btn = gr.Button("✨ Generate Prompt", variant="primary")
             with gr.Column(scale=2):
-                prompt_output = gr.Textbox(label="📝 Optimized Prompt", lines=8, interactive=True, show_copy_button=True)
                 status_msg = gr.Textbox(label="Status", visible=True)
-                quality_report = gr.JSON(label="🔍 Quality Report", visible=True)
-                token_stats = gr.JSON(label="🧮 Token Usage", visible=True)
-        # Event bindings
         gen_btn.click(
             fn=generate_prompt,
-            inputs=[img_input, api_key, style, creativity, neg_prompt, aspect, color_mode, dpi],
-            outputs=None
         ).then(
-            fn=format_generation_response,
-            inputs=None,
-            outputs=[prompt_output, quality_report, token_stats]
-        ).then(
-            fn=update_status,
-            inputs=[prompt_output],
-            outputs=[status_msg]
         )
     return app
-# --- Launch App ---
 if __name__ == "__main__":
     app = build_interface()
-    app.launch(server_port=DEFAULT_PORT)

 # --- Environment Configuration ---
 GEMINI_KEY = os.environ.get("GEMINI_KEY", "")
 DEFAULT_PORT = int(os.environ.get("PORT", 7860))
+API_TIMEOUT = 30  # seconds
 # --- Style Template Optimization ---
 BASE_TEMPLATE = """Describe this design as a concise Flux 1.1 Pro prompt focusing on:
 # --- Core Generation Engine ---
 def generate_prompt(image, api_key, style, creativity, neg_prompt, aspect, color_mode, dpi):
     try:
+        # Validate inputs
         if not image:
+            return {"error": "Please upload an image"}
         api_key = api_key or GEMINI_KEY
         if not api_key:
+            return {"error": "API key required - set in env (GEMINI_KEY) or input field"}
+        # Import and configure Gemini only when needed
         try:
             import google.generativeai as genai
             genai.configure(api_key=api_key)
             model = genai.GenerativeModel("gemini-1.5-pro")
         except ImportError:
+            return {"error": "Failed to import google.generativeai. Install with: pip install google-generativeai"}
         except Exception as e:
             if "authentication" in str(e).lower():
+                return {"error": "Invalid API key or authentication error"}
+            else:
+                return {"error": f"API initialization error: {str(e)}"}
+        # Process image with timeout protection
+        start_time = time.time()
         img = preprocess_image(image)
         img_bytes = io.BytesIO()
         img.save(img_bytes, format="PNG")
         img_b64 = base64.b64encode(img_bytes.getvalue()).decode()
+        # Build instruction
         instruction = f"{STYLE_INSTRUCTIONS[style]}\nAVOID: {neg_prompt}\n"
         instruction += f"ASPECT: {aspect}, COLORS: {color_mode}, DPI: {dpi}\n"
+        # Generate prompt with timeout protection
         try:
             response = model.generate_content(
                 contents=[instruction, {"mime_type": "image/png", "data": img_b64}],
             )
             raw_prompt = response.text
         except Exception as e:
+            return {"error": f"Generation failed: {str(e)}"}
+        # Simple quality validation
         validation = {"score": 8, "issues": [], "suggestions": []}
+        # Token tracking
+        input_tokens = len(img_b64) // 4  # Approximate base64 token count
         output_tokens = len(raw_prompt.split())
+        return {
+            "prompt": raw_prompt,
+            "validation": validation,
+            "stats": {"input": input_tokens, "output": output_tokens}
         }
     except Exception as e:
         traceback.print_exc()
         return {"error": str(e)}
+# --- UI Response Formatting ---
 def format_generation_response(result):
     """Format the response from generate_prompt for the UI"""
     if "error" in result:
+        return result["error"], None, None
     else:
         return result.get("prompt", ""), result.get("validation", {}), result.get("stats", {})
+# Modern copy function using Gradio's JavaScript API
+def copy_text(text):
+    return gr.update(value=text), f"✓ Copied: '{text[:20]}...'", gr.Button.update(variant="secondary")
 # --- Main Interface ---
 def build_interface():
+    with gr.Blocks(title="Flux Pro Generator", theme="soft") as app:
         # Header
         gr.Markdown("# 🎨 Flux Pro Prompt Generator")
         gr.Markdown("Generate optimized design prompts from images using Google's Gemini")
+        # Security Section
         api_key = gr.Textbox(
             label="🔑 Gemini API Key",
             value=GEMINI_KEY,
             info="Set GEMINI_KEY environment variable for production"
         )
+        # Main Workflow
         with gr.Row():
             with gr.Column(scale=1):
+                img_input = gr.Image(
+                    label="🖼️ Upload Design",
+                    type="pil",
+                    sources=["upload"],
+                    interactive=True
+                )
+                style = gr.Dropdown(
+                    list(STYLE_INSTRUCTIONS.keys()),
+                    value="General",
+                    label="🎨 Target Style"
+                )
+                # Advanced Settings
                 with gr.Accordion("⚙️ Advanced Settings", open=False):
+                    creativity = gr.Slider(0.0, 1.0, 0.7, label="Creativity Level")
                     neg_prompt = gr.Textbox(label="🚫 Negative Prompts", placeholder="What to avoid")
                     aspect = gr.Dropdown(FLUX_SPECS["aspect_ratios"], value="1:1", label="Aspect Ratio")
                     color_mode = gr.Dropdown(FLUX_SPECS["color_modes"], value="RGB", label="Color Mode")
                     dpi = gr.Dropdown([str(d) for d in FLUX_SPECS["dpi_options"]], value="300", label="Output DPI")
                 gen_btn = gr.Button("✨ Generate Prompt", variant="primary")
             with gr.Column(scale=2):
+                prompt_output = gr.Textbox(
+                    label="📝 Optimized Prompt",
+                    lines=8,
+                    interactive=True,
+                    show_copy_button=True  # Modern Gradio has built-in copy button
+                )
                 status_msg = gr.Textbox(label="Status", visible=True)
+                with gr.Row():
+                    copy_btn = gr.Button("📋 Copy to Clipboard", variant="secondary")
+                quality_report = gr.JSON(
+                    label="🔍 Quality Report",
+                    visible=True
+                )
+                token_stats = gr.JSON(
+                    label="🧮 Token Usage",
+                    visible=True
+                )
+        # Event Handling
         gen_btn.click(
             fn=generate_prompt,
+            inputs=[
+                img_input, api_key, style, creativity,
+                neg_prompt, aspect, color_mode, dpi
+            ],
+            outputs=[prompt_output, quality_report, token_stats],
+            api_name="generate"
         ).then(
+            fn=lambda: gr.update(value="Generation complete!"),
+            outputs=status_msg
+        )
+        # Modern copy implementation
+        copy_btn.click(
+            fn=copy_text,
+            inputs=prompt_output,
+            outputs=[prompt_output, status_msg, copy_btn],
+            js="(text) => { if(text) { navigator.clipboard.writeText(text); } return [text]; }"
         )
     return app
+# --- Production Launch ---
 if __name__ == "__main__":
     app = build_interface()
+    app.launch()