Spaces:

Ujeshhh
/

image-captioning

Build error

App Files Files

xet

Community

Ujeshhh committed on Apr 2

Commit

55f0a1e

verified ·

1 Parent(s): 6579c7d

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -29

app.py CHANGED Viewed

@@ -1,36 +1,25 @@
import base64
import mimetypes
import os

import gradio as gr
import openai

# Read the OpenAI API key from the environment instead of embedding it in the
# source. On a hosted Space, define OPENAI_API_KEY as a repository secret.
# Any key that has ever been committed to a repository must be treated as
# compromised: revoke it and issue a new one.
openai.api_key = os.environ.get("OPENAI_API_KEY")


def generate_caption(image):
    """Generate a caption for the uploaded image using an OpenAI vision model.

    Args:
        image: Filesystem path of the uploaded image (the Gradio input is
            configured with ``type="filepath"``). Falsy when nothing was
            uploaded.

    Returns:
        The caption text produced by the model, or a short prompt asking the
        user to upload an image when ``image`` is empty.
    """
    # Submitting the form without an image yields no path; answer with a
    # message rather than failing inside open().
    if not image:
        return "Please upload an image first."

    # Label the data URL with the real media type of the file (PNG, WebP, ...)
    # instead of always claiming JPEG; fall back to JPEG when the extension
    # is unknown or does not map to an image type.
    mime_type, _ = mimetypes.guess_type(image)
    if mime_type is None or not mime_type.startswith("image/"):
        mime_type = "image/jpeg"

    # The image is sent inline as a Base64-encoded data URL.
    with open(image, "rb") as img_file:
        img_base64 = base64.b64encode(img_file.read()).decode("utf-8")

    response = openai.chat.completions.create(
        model="gpt-4o-mini",
        messages=[
            {"role": "system", "content": "You are an AI that describes images accurately."},
            {
                "role": "user",
                "content": [
                    {"type": "text", "text": "Describe this image in detail."},
                    {
                        "type": "image_url",
                        "image_url": {"url": f"data:{mime_type};base64,{img_base64}"},
                    },
                ],
            },
        ],
        max_tokens=100,  # caps the length of the generated description
    )

    # The caption is the message content of the first returned choice.
    return response.choices[0].message.content
 # Gradio UI
@@ -38,8 +27,8 @@ iface = gr.Interface(
     fn=generate_caption,
     inputs=gr.Image(type="filepath"),
     outputs="text",
-    title="Image Captioning App",
-    description="Upload an image, and the AI will generate a descriptive caption."
 )
 # Run the app

import os

import google.generativeai as genai
import gradio as gr
from PIL import Image

# Read the Gemini API key from the environment instead of embedding it in the
# source. On a hosted Space, define GOOGLE_API_KEY as a repository secret.
# Any key that has ever been committed to a repository must be treated as
# compromised: revoke it and issue a new one.
genai.configure(api_key=os.environ.get("GOOGLE_API_KEY"))


def generate_caption(image):
    """Generate a caption for the uploaded image using the Google Gemini API.

    Args:
        image: Filesystem path of the uploaded image (the Gradio input is
            configured with ``type="filepath"``). Falsy when nothing was
            uploaded.

    Returns:
        The caption text produced by the model, or a short prompt asking the
        user to upload an image when ``image`` is empty.
    """
    # Submitting the form without an image yields no path; answer with a
    # message rather than failing inside Image.open().
    if not image:
        return "Please upload an image first."

    # NOTE(review): "gemini-pro-vision" is an older model identifier; confirm
    # it is still served for this API key before relying on it.
    model = genai.GenerativeModel("gemini-pro-vision")

    # Keep the file open only for the duration of the request so the handle
    # is released as soon as the call returns.
    with Image.open(image) as img:
        response = model.generate_content(
            [img, "Describe the contents of this image in detail."]
        )

    # The caption is the text of the model response.
    return response.text
 # Gradio UI
     fn=generate_caption,
     inputs=gr.Image(type="filepath"),
     outputs="text",
+    title="Free Image Captioning App",
+    description="Upload an image, and the AI (Google Gemini) will generate a descriptive caption."
 )
 # Run the app