Spaces:

CognizantAI
/

marketing-image-generator

Running

App Files Files Community

Noo88ear committed 13 days ago

Commit

b240d03

verified ·

1 Parent(s): ac520ab

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -19

app.py CHANGED Viewed

@@ -62,7 +62,7 @@ except ImportError:
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
-# Get API keys - prioritize HuggingFace Secrets
 GCP_KEYS = [
     # Hugging Face Secrets (these are the primary ones for HF deployment)
     os.getenv("GOOGLE_API_KEY"),
@@ -96,14 +96,14 @@ def enhance_prompt_with_gemini(prompt: str, style: str) -> str:
         style (str): The desired image style
     Returns:
-        str: Enhanced prompt optimized for image generation
     """
     if not GEMINI_AVAILABLE or not GOOGLE_API_KEY:
         # Basic enhancement without Gemini
         style_enhancers = {
             "realistic": "photorealistic, high detail, professional photography, sharp focus",
             "artistic": "artistic masterpiece, creative composition, painterly style",
-            "cartoon": "cartoon style, vibrant colors, playful, animated character design",
             "photographic": "professional photograph, high quality, detailed, commercial photography",
             "illustration": "digital illustration, clean vector art, modern design"
         }
@@ -139,7 +139,7 @@ def enhance_prompt_with_gemini(prompt: str, style: str) -> str:
         style_enhancers = {
             "realistic": "photorealistic, high detail, professional photography",
             "artistic": "artistic masterpiece, creative composition",
-            "cartoon": "cartoon style, vibrant colors, playful",
             "photographic": "professional photograph, high quality, detailed",
             "illustration": "digital illustration, clean design"
         }
@@ -169,18 +169,22 @@ def generate_marketing_image(prompt: str, style: str = "realistic") -> str:
                 logger.info("🎨 Using Google Genai SDK for image generation")
                 logger.info(f"API Key available: {GOOGLE_API_KEY[:10]}...")
-                # Initialize the genai SDK client
                 client = genai_sdk.Client(api_key=GOOGLE_API_KEY)
-                # Generate image using Imagen 4.0 with reduced safety filtering
                 result = client.models.generate_images(
                     model="imagen-4.0-generate-preview-06-06",
                     prompt=enhanced_prompt,
                     config={
                         "number_of_images": 1,
                         "output_mime_type": "image/png",
-                        "safety_filter_level": "block_low_and_above",
-                        "include_safety_attributes": False
                     }
                 )
@@ -244,9 +248,9 @@ def generate_marketing_image(prompt: str, style: str = "realistic") -> str:
             "style": style
         })
-def analyze_marketing_image_with_gemini(image_url: str, prompt: str, review_guidelines: str = "") -> str:
     """
-    Analyze a generated marketing image using Gemini Vision for quality, relevance, and compliance.
     Args:
         image_url (str): URL or base64 data of the generated image
@@ -272,7 +276,7 @@ def analyze_marketing_image_with_gemini(image_url: str, prompt: str, review_guid
         CRITICAL MARKETING CHECKS:
         1. **Language/Text Requirements**: If guidelines mention "English" or specific language requirements, verify ALL visible text matches
-        2. **Brand Compliance**: Check professional appearance, color consistency, readability
         3. **Marketing Effectiveness**: Assess visual appeal and message clarity
         4. **Target Audience**: Evaluate cultural appropriateness and accessibility
@@ -502,9 +506,9 @@ def generate_and_review_marketing_image(prompt: str, style: str = "realistic", r
                 })
                 continue
-            # Step 2: Analyze the generated image with Gemini Vision
             image_url = generation_data.get("image_url", "")
-            analysis_response = analyze_marketing_image_with_gemini(image_url, prompt, review_guidelines)
             analysis_data = json.loads(analysis_response)
             current_score = analysis_data.get("overall_score", 0.0)
@@ -612,8 +616,10 @@ def process_generated_image_and_results(api_response_str: str) -> Tuple[Image.Im
             # Add specific documentation links for common errors
             doc_link = ""
-            if any(brand in error_msg.lower() for brand in ['hsbc', 'bank', 'political', 'timeout', 'stall']):
-                doc_link = "\n\n📖 See content restrictions guide: https://huggingface.co/spaces/CognizantAI/marketing-image-generator/blob/main/README.md#content-policy--brand-restrictions"
             elif 'api' in error_msg.lower() or 'key' in error_msg.lower():
                 doc_link = "\n\n📖 See API troubleshooting: https://huggingface.co/spaces/CognizantAI/marketing-image-generator/blob/main/README.md#common-issues"
@@ -731,7 +737,7 @@ def gradio_generate_marketing_image(prompt: str, style: str, max_retries: int, r
         )
         return process_generated_image_and_results(result_json)
     except Exception as e:
-        error_message = f"❌ Error: {str(e)}\n\n📖 For troubleshooting help, see: https://huggingface.co/spaces/CognizantAI/marketing-image-generator/blob/main/README.md#content-policy--brand-restrictions"
         logger.error(error_message)
         return None, error_message
@@ -739,10 +745,10 @@ def gradio_generate_marketing_image(prompt: str, style: str, max_retries: int, r
 SUGGESTED_PROMPTS = {
     "Modern office team collaboration": ("A modern office space with diverse professionals collaborating around a sleek conference table, natural lighting, professional attire, English signage visible", "realistic"),
     "Executive boardroom meeting": ("Professional executive boardroom with polished conference table, city skyline view, business documents, English presentations on screens", "realistic"),
-    "Customer service excellence": ("Professional customer service representative with headset in modern call center, English signage, clean corporate environment", "realistic"),
     "Product showcase display": ("Clean product showcase on white background with professional lighting, English product labels, minimalist marketing aesthetic", "realistic"),
-    "Creative workspace design": ("Creative workspace with colorful design elements, inspirational English quotes on walls, modern furniture, artistic marketing materials", "artistic"),
-    "Brand presentation setup": ("Professional brand presentation setup with English branded materials, corporate colors, marketing displays, conference room setting", "realistic")
 }
 # Create Gradio interface

 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
+# Get API keys - prioritise HuggingFace Secrets
 GCP_KEYS = [
     # Hugging Face Secrets (these are the primary ones for HF deployment)
     os.getenv("GOOGLE_API_KEY"),
         style (str): The desired image style
     Returns:
+        str: Enhanced prompt optimised for image generation
     """
     if not GEMINI_AVAILABLE or not GOOGLE_API_KEY:
         # Basic enhancement without Gemini
         style_enhancers = {
             "realistic": "photorealistic, high detail, professional photography, sharp focus",
             "artistic": "artistic masterpiece, creative composition, painterly style",
+            "cartoon": "cartoon style, vibrant colours, playful, animated character design",
             "photographic": "professional photograph, high quality, detailed, commercial photography",
             "illustration": "digital illustration, clean vector art, modern design"
         }
         style_enhancers = {
             "realistic": "photorealistic, high detail, professional photography",
             "artistic": "artistic masterpiece, creative composition",
+            "cartoon": "cartoon style, vibrant colours, playful",
             "photographic": "professional photograph, high quality, detailed",
             "illustration": "digital illustration, clean design"
         }
                 logger.info("🎨 Using Google Genai SDK for image generation")
                 logger.info(f"API Key available: {GOOGLE_API_KEY[:10]}...")
+                # Initialise the genai SDK client
                 client = genai_sdk.Client(api_key=GOOGLE_API_KEY)
+                # Generate image using Imagen 4.0 with an explicit safety filter level.
+                # Safety configuration: "block_low_and_above" - intended to allow corporate/business
+                # content (financial institutions, corporate brands, marketing material) while
+                # still maintaining essential safety guardrails and blocking genuinely harmful content.
+                # NOTE(review): Google's Imagen documentation describes "block_low_and_above" as the
+                # strictest filter level, not a reduced one - confirm this value matches the intent.
                 result = client.models.generate_images(
                     model="imagen-4.0-generate-preview-06-06",
                     prompt=enhanced_prompt,
                     config={
                         "number_of_images": 1,
                         "output_mime_type": "image/png",
+                        "safety_filter_level": "block_low_and_above",  # Reduced from default strict filtering
+                        "include_safety_attributes": False  # Cleaner response without safety metadata
                     }
                 )
             "style": style
         })
+def analyse_marketing_image_with_gemini(image_url: str, prompt: str, review_guidelines: str = "") -> str:
     """
+    Analyse a generated marketing image using Gemini Vision for quality, relevance, and compliance.
     Args:
         image_url (str): URL or base64 data of the generated image
         CRITICAL MARKETING CHECKS:
         1. **Language/Text Requirements**: If guidelines mention "English" or specific language requirements, verify ALL visible text matches
+        2. **Brand Compliance**: Check professional appearance, colour consistency, readability
         3. **Marketing Effectiveness**: Assess visual appeal and message clarity
         4. **Target Audience**: Evaluate cultural appropriateness and accessibility
                 })
                 continue
+            # Step 2: Analyse the generated image with Gemini Vision
             image_url = generation_data.get("image_url", "")
+            analysis_response = analyse_marketing_image_with_gemini(image_url, prompt, review_guidelines)
             analysis_data = json.loads(analysis_response)
             current_score = analysis_data.get("overall_score", 0.0)
             # Add specific documentation links for common errors
             doc_link = ""
+            if any(keyword in error_msg.lower() for keyword in ['political', 'timeout', 'stall']):
+                doc_link = "\n\n📖 See updated safety configuration: https://huggingface.co/spaces/CognizantAI/marketing-image-generator/blob/main/README.md#content-policy--safety-configuration"
+            elif any(keyword in error_msg.lower() for keyword in ['hsbc', 'bank', 'corporate']):
+                doc_link = "\n\n💡 Note: Financial brands now work better with reduced safety filtering. See: https://huggingface.co/spaces/CognizantAI/marketing-image-generator/blob/main/README.md#improved-content-support"
             elif 'api' in error_msg.lower() or 'key' in error_msg.lower():
                 doc_link = "\n\n📖 See API troubleshooting: https://huggingface.co/spaces/CognizantAI/marketing-image-generator/blob/main/README.md#common-issues"
         )
         return process_generated_image_and_results(result_json)
     except Exception as e:
+        error_message = f"❌ Error: {str(e)}\n\n📖 For troubleshooting help, see: https://huggingface.co/spaces/CognizantAI/marketing-image-generator/blob/main/README.md#content-policy--safety-configuration"
         logger.error(error_message)
         return None, error_message
 SUGGESTED_PROMPTS = {
     "Modern office team collaboration": ("A modern office space with diverse professionals collaborating around a sleek conference table, natural lighting, professional attire, English signage visible", "realistic"),
     "Executive boardroom meeting": ("Professional executive boardroom with polished conference table, city skyline view, business documents, English presentations on screens", "realistic"),
+    "Customer service excellence": ("Professional customer service representative with headset in modern call centre, English signage, clean corporate environment", "realistic"),
     "Product showcase display": ("Clean product showcase on white background with professional lighting, English product labels, minimalist marketing aesthetic", "realistic"),
+    "Creative workspace design": ("Creative workspace with colourful design elements, inspirational English quotes on walls, modern furniture, artistic marketing materials", "artistic"),
+    "Brand presentation setup": ("Professional brand presentation setup with English branded materials, corporate colours, marketing displays, conference room setting", "realistic")
 }
 # Create Gradio interface