Spaces:

Athspi
/

Gttg

Sleeping

App Files Community

Athspi committed on Mar 22

Commit

19af451

verified ·

1 Parent(s): b0a339e

Update app.py

Browse files

Files changed (1) hide show

app.py +87 -68

app.py CHANGED Viewed

@@ -19,24 +19,26 @@ os.makedirs(UPLOAD_FOLDER, exist_ok=True)
 os.makedirs(RESULT_FOLDER, exist_ok=True)
 def upload_image(image_data_url):
-    """Helper function to upload image to Gemini"""
     try:
         header, encoded = image_data_url.split(',', 1)
-    except ValueError:
-        raise ValueError("Invalid image data")
-    binary_data = base64.b64decode(encoded)
-    ext = ".png" if "png" in header.lower() else ".jpg"
-    temp_filename = secure_filename("temp_image" + ext)
-    temp_filepath = os.path.join(UPLOAD_FOLDER, temp_filename)
-    with open(temp_filepath, "wb") as f:
-        f.write(binary_data)
-    return client.files.upload(file=temp_filepath)
 def is_prohibited_request(uploaded_file, object_type):
-    """Check if request is to remove person/animal using gemini-2.0-flash-lite"""
     model = "gemini-2.0-flash-lite"
     parts = [
         types.Part.from_uri(file_uri=uploaded_file.uri, mime_type=uploaded_file.mime_type),
@@ -46,14 +48,23 @@ def is_prohibited_request(uploaded_file, object_type):
     contents = [types.Content(role="user", parts=parts)]
     generate_content_config = types.GenerateContentConfig(
-        system_instruction=[
-            types.Part.from_text(text="""Determine if the user wants to remove a person or animal.
-            Respond ONLY with 'Yes' or 'No'. Consider these examples:
-            - Remove person → Yes
-            - Remove dog → Yes
-            - Remove sunglasses → No
-            - Remove background → No""")
-        ],
         temperature=0.0,
         max_output_tokens=1,
     )
@@ -66,49 +77,53 @@ def is_prohibited_request(uploaded_file, object_type):
         )
         if response.candidates and response.candidates[0].content.parts:
             return response.candidates[0].content.parts[0].text.strip().lower() == "yes"
-        return False
     except Exception as e:
-        print(f"Prohibition check error: {str(e)}")
-        return False
-def generate_gemini_output(object_type, uploaded_file):
-    """Generate image using gemini-2.0-flash-exp-image-generation"""
     model = "gemini-2.0-flash-exp-image-generation"
     parts = [
         types.Part.from_uri(file_uri=uploaded_file.uri, mime_type=uploaded_file.mime_type),
-        types.Part.from_text(text=f"Remove {object_type} from the image")
     ]
     contents = [types.Content(role="user", parts=parts)]
     generate_content_config = types.GenerateContentConfig(
-        temperature=1,
-        top_p=0.95,
-        top_k=40,
-        max_output_tokens=8192,
-        response_modalities=["image", "text"],
         safety_settings=[
-            types.SafetySetting(category="HARM_CATEGORY_CIVIC_INTEGRITY", threshold="OFF"),
-        ],
     )
-    result_image = None
-    for chunk in client.models.generate_content_stream(
-        model=model,
-        contents=contents,
-        config=generate_content_config,
-    ):
-        if chunk.candidates and chunk.candidates[0].content.parts:
-            part = chunk.candidates[0].content.parts[0]
-            if part.inline_data:
-                file_extension = mimetypes.guess_extension(part.inline_data.mime_type) or ".png"
-                output_filename = secure_filename("generated_output" + file_extension)
-                result_image_path = os.path.join(RESULT_FOLDER, output_filename)
-                with open(result_image_path, "wb") as f:
-                    f.write(part.inline_data.data)
-                result_image = result_image_path
-    return result_image
 @app.route("/")
 def index():
@@ -117,36 +132,40 @@ def index():
 @app.route("/process", methods=["POST"])
 def process():
     try:
-        data = request.get_json(force=True)
-        image_data = data.get("image")
-        object_type = data.get("objectType", "").strip()
-        if not image_data or not object_type:
-            return jsonify({"success": False, "message": "Missing required data"}), 400
-        # Upload image once
         uploaded_file = upload_image(image_data)
-        # Check for prohibited requests
         if is_prohibited_request(uploaded_file, object_type):
             return jsonify({
                 "success": False,
-                "message": "Sorry, I can't assist with removing people or animals."
-            }), 400
-        # Generate output if allowed
-        result_image = generate_gemini_output(object_type, uploaded_file)
-        if not result_image:
             return jsonify({"success": False, "message": "Failed to generate image"}), 500
         return jsonify({
             "success": True,
-            "resultPath": f"/static/{os.path.basename(result_image)}"
         })
     except Exception as e:
-        return jsonify({"success": False, "message": f"Error: {str(e)}"}), 500
 if __name__ == "__main__":
-    app.run(host="0.0.0.0", port=7860)

 os.makedirs(RESULT_FOLDER, exist_ok=True)
 def upload_image(image_data_url):
+    """Handle base64 image upload and Gemini file upload"""
     try:
         header, encoded = image_data_url.split(',', 1)
+        binary_data = base64.b64decode(encoded)
+        ext = ".png" if "png" in header.lower() else ".jpg"
+        temp_filename = secure_filename(f"temp_{os.urandom(8).hex()}{ext}")
+        temp_filepath = os.path.join(UPLOAD_FOLDER, temp_filename)
+        with open(temp_filepath, "wb") as f:
+            f.write(binary_data)
+        uploaded_file = client.files.upload(file=temp_filepath)
+        os.remove(temp_filepath)  # Clean up temporary file
+        return uploaded_file
+    except Exception as e:
+        raise ValueError(f"Image processing error: {str(e)}")
 def is_prohibited_request(uploaded_file, object_type):
+    """Check if request involves people/animals or their belongings"""
     model = "gemini-2.0-flash-lite"
     parts = [
         types.Part.from_uri(file_uri=uploaded_file.uri, mime_type=uploaded_file.mime_type),
     contents = [types.Content(role="user", parts=parts)]
     generate_content_config = types.GenerateContentConfig(
+        system_instruction=[types.Part.from_text(text="""Analyze image and request to detect:
+1. Direct removal of people/animals
+2. Removal of items attached to/worn by people/animals
+3. Removal of body parts or personal belongings
+Prohibited examples:
+- Person, dog, cat
+- Sunglasses on face, mask, hat
+- Phone in hand, watch on wrist
+- Eyes, hands, hair
+Allowed examples:
+- Background, car, tree
+- Sunglasses on table
+- Phone on desk
+Respond ONLY with 'Yes' or 'No'""")],
         temperature=0.0,
         max_output_tokens=1,
     )
         )
         if response.candidates and response.candidates[0].content.parts:
             return response.candidates[0].content.parts[0].text.strip().lower() == "yes"
+        return True  # Default to safe mode if uncertain
     except Exception as e:
+        print(f"Safety check failed: {str(e)}")
+        return True  # Block if check fails
+def generate_modified_image(uploaded_file, object_type):
+    """Generate image with object removed using experimental model"""
     model = "gemini-2.0-flash-exp-image-generation"
     parts = [
         types.Part.from_uri(file_uri=uploaded_file.uri, mime_type=uploaded_file.mime_type),
+        types.Part.from_text(text=f"Completely remove {object_type} from the image without leaving traces")
     ]
     contents = [types.Content(role="user", parts=parts)]
     generate_content_config = types.GenerateContentConfig(
+        temperature=0.5,
+        top_p=0.9,
+        max_output_tokens=1024,
+        response_modalities=["image"],
         safety_settings=[
+            types.SafetySetting(category="HARM_CATEGORY_CIVIC_INTEGRITY", threshold="BLOCK_NONE"),
+            types.SafetySetting(category="HARM_CATEGORY_VIOLENCE", threshold="BLOCK_NONE")
+        ]
     )
+    try:
+        for chunk in client.models.generate_content_stream(
+            model=model,
+            contents=contents,
+            config=generate_content_config,
+        ):
+            if chunk.candidates and chunk.candidates[0].content.parts:
+                part = chunk.candidates[0].content.parts[0]
+                if part.inline_data:
+                    ext = mimetypes.guess_extension(part.inline_data.mime_type) or ".png"
+                    output_filename = secure_filename(f"result_{os.urandom(4).hex()}{ext}")
+                    output_path = os.path.join(RESULT_FOLDER, output_filename)
+                    with open(output_path, "wb") as f:
+                        f.write(part.inline_data.data)
+                    return output_path
+        return None
+    except Exception as e:
+        print(f"Image generation failed: {str(e)}")
+        return None
 @app.route("/")
 def index():
 @app.route("/process", methods=["POST"])
 def process():
     try:
+        data = request.get_json()
+        if not data or "image" not in data or "objectType" not in data:
+            return jsonify({"success": False, "message": "Invalid request format"}), 400
+        image_data = data["image"]
+        object_type = data["objectType"].strip().lower()
+        if not object_type:
+            return jsonify({"success": False, "message": "Please specify an object to remove"}), 400
+        # Process image upload
         uploaded_file = upload_image(image_data)
+        # Safety check
         if is_prohibited_request(uploaded_file, object_type):
             return jsonify({
                 "success": False,
+                "message": "Cannot remove people, animals, or personal items"
+            }), 403
+        # Generate modified image
+        result_path = generate_modified_image(uploaded_file, object_type)
+        if not result_path:
             return jsonify({"success": False, "message": "Failed to generate image"}), 500
         return jsonify({
             "success": True,
+            "resultUrl": f"/static/{os.path.basename(result_path)}"
         })
+    except ValueError as e:
+        return jsonify({"success": False, "message": str(e)}), 400
     except Exception as e:
+        return jsonify({"success": False, "message": "Internal server error"}), 500
 if __name__ == "__main__":
+    app.run(host="0.0.0.0", port=7860,)