Spaces:

Ujeshhh
/

image-captioning

Sleeping

Ujeshhh committed on Apr 2

Commit

410478b

verified ·

1 Parent(s): 3c6c0fd

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,31 +1,35 @@
 import openai
 import gradio as gr
 import os
 # Read the OpenAI API key from the environment (for example a Space secret
 # named OPENAI_API_KEY) so the credential is never stored in the repository.
 # NOTE: a key that was previously committed here remains visible in the
 # commit history and should be revoked and replaced.
 openai.api_key = os.getenv("OPENAI_API_KEY")
 def generate_caption(image):
     """Generate a caption for the uploaded image using OpenAI's GPT-4 Vision API."""
     # NOTE(review): this is the pre-change side of the diff; the lines marked
     # "-" below appear to be the ones this commit removes, so they are kept
     # verbatim. `image` is passed straight to open(), i.e. it is used as a
     # file path.
     # The removed call builds the data URL from `img_file.read().decode()`,
     # which decodes the raw image bytes as text instead of Base64-encoding
     # them, even though the URL is labelled ";base64".
     with open(image, "rb") as img_file:
-        response = openai.chat.completions.create(
-            model="gpt-4-turbo",
-            messages=[
-                {
-                    "role": "system",
-                    "content": "You are an AI assistant that describes images accurately."
-                },
-                {
-                    "role": "user",
-                    "content": [
-                        {"type": "text", "text": "Describe the contents of this image in detail."},
-                        {"type": "image_url", "image_url": {"url": "data:image/jpeg;base64," + img_file.read().decode()}},
-                    ],
-                },
-            ],
-            max_tokens=100
-        )
     # The caption is the message text of the first returned choice.
     caption = response.choices[0].message.content
     return caption

 import openai
 import gradio as gr
 import os
+import base64
 # Read the OpenAI API key from the environment (for example a Space secret
 # named OPENAI_API_KEY) so the credential is never stored in the repository.
 # NOTE: a key that was previously committed here remains visible in the
 # commit history and should be revoked and replaced.
 openai.api_key = os.getenv("OPENAI_API_KEY")
 def generate_caption(image):
     """Generate a caption for the uploaded image using OpenAI's GPT-4 Vision API.

     Args:
         image: Filesystem path of the image to caption. ``None`` or an empty
             path (nothing was uploaded) is accepted.

     Returns:
         The message text of the first completion choice, or a short prompt
         asking for an upload when no image was supplied.
     """
     # Local import: the file's import block does not provide mimetypes.
     import mimetypes

     # Nothing uploaded: skip the API call instead of failing inside open().
     if not image:
         return "Please upload an image to caption."

     # Label the data URL with the file's actual type (PNG, WebP, ...) rather
     # than always claiming JPEG; fall back to JPEG when it cannot be guessed.
     mime_type, _ = mimetypes.guess_type(image)
     if mime_type is None or not mime_type.startswith("image/"):
         mime_type = "image/jpeg"

     # Convert image to Base64
     with open(image, "rb") as img_file:
         img_base64 = base64.b64encode(img_file.read()).decode("utf-8")

     # OpenAI API call
     response = openai.chat.completions.create(
         model="gpt-4-turbo",
         messages=[
             {"role": "system", "content": "You are an AI that describes images accurately."},
             {
                 "role": "user",
                 "content": [
                     {"type": "text", "text": "Describe this image in detail."},
                     {"type": "image_url", "image_url": {"url": f"data:{mime_type};base64,{img_base64}"}},
                 ],
             },
         ],
         max_tokens=100,
     )

     # Extract and return caption
     caption = response.choices[0].message.content
     return caption