Final_Assignment_Template

Sleeping

dlaima committed on Jun 2

Commit

5c5f32d

verified ·

1 Parent(s): 02a5e73

Update image_analyzer.py

Files changed (1) hide show

image_analyzer.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import base64
 import openai
 from smolagents import Tool
@@ -6,23 +7,27 @@ class ImageAnalysisTool(Tool):
     name = "image_analysis"
     description = "Analyze the content of an image and answer a specific question about it."
     inputs = {
-        "image_path": {
             "type": "string",
-            "description": "Path to the image file (jpg, png, etc.)"
         },
         "question": {
             "type": "string",
-            "description": "A question about the image content"
         }
     }
     output_type = "string"
-    def __init__(self):
-        super().__init__()
-    def forward(self, image_path: str, question: str) -> str:
-        base64_image = self.encode_image(image_path)
         try:
             response = openai.ChatCompletion.create(
                 model="gpt-4-turbo",
                 messages=[
@@ -41,7 +46,7 @@ class ImageAnalysisTool(Tool):
                 ],
                 max_tokens=300
             )
-            return response["choices"][0]["message"]["content"]
         except Exception as e:
             return f"Error analyzing image: {e}"
@@ -50,4 +55,5 @@ class ImageAnalysisTool(Tool):
             return base64.b64encode(image_file.read()).decode("utf-8")

 import base64
+import requests
 import openai
 from smolagents import Tool
     name = "image_analysis"
     description = "Analyze the content of an image and answer a specific question about it."
     inputs = {
+        "url": {
             "type": "string",
+            "description": "URL to the image"
         },
         "question": {
             "type": "string",
+            "description": "Question about the image content"
         }
     }
     output_type = "string"
+    def forward(self, url: str, question: str) -> str:
         try:
+            # Download image
+            image_path = "/tmp/image_input.jpg"
+            r = requests.get(url)
+            with open(image_path, "wb") as f:
+                f.write(r.content)
+            # Encode & analyze
+            base64_image = self.encode_image(image_path)
             response = openai.ChatCompletion.create(
                 model="gpt-4-turbo",
                 messages=[
                 ],
                 max_tokens=300
             )
+            return response["choices"][0]["message"]["content"].strip()
         except Exception as e:
             return f"Error analyzing image: {e}"
             return base64.b64encode(image_file.read()).decode("utf-8")