Test_Magus

Running

App Files Community

SergeyO7 committed on 17 days ago

Commit

5b72b9c

verified ·

1 Parent(s): ec01a22

Update agent.py

Browse files

Files changed (1) hide show

agent.py +21 -12

agent.py CHANGED Viewed

@@ -1,6 +1,7 @@
 from smolagents import CodeAgent,  LiteLLMModel, tool, load_tool, DuckDuckGoSearchTool, WikipediaSearchTool #, HfApiModel, OpenAIServerModel
 import asyncio
 import os
 import yaml
 from PIL import Image
 import requests
@@ -35,23 +36,33 @@ import whisper
 #        return f"Error performing Google search: {str(e)}"
 @tool
-def ImageAnalysisTool(image_path: str) -> str:
-    """Tool for analyzing images using computer vision
     Args:
-        image_path (str): Path to image file
     Returns:
-        str: Image description
     """
     headers = {
-        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/114.0.0.0 Safari/537.36"
     }
-    response = requests.get(image_path,headers=headers)
-    image = Image.open(BytesIO(response.content)).convert("RGB")
     model = LiteLLMModel(
         model_id="gemini/gemini-2.0-flash",
-        api_key= os.environ.get("GEMINI_KEY"),
         max_tokens=8192
     )
@@ -63,10 +74,8 @@ def ImageAnalysisTool(image_path: str) -> str:
     )
     response = agent.run(
-        """
-        Describe in details the chess position you see in the image.
-        """,
-        images=image
     )
     return f"The image description: '{response}'"

 from smolagents import CodeAgent,  LiteLLMModel, tool, load_tool, DuckDuckGoSearchTool, WikipediaSearchTool #, HfApiModel, OpenAIServerModel
 import asyncio
 import os
+import re
 import yaml
 from PIL import Image
 import requests
 #        return f"Error performing Google search: {str(e)}"
 @tool
+def ImageAnalysisTool(question: str) -> str:
+    """Tool for analyzing images mentioned in the question.
     Args:
+        question (str): The question text which may contain an image URL.
     Returns:
+        str: Image description or error message.
     """
+    # Extract URL from question using regex
+    url_pattern = r'https?://\S+'
+    match = re.search(url_pattern, question)
+    if not match:
+        return "No image URL found in the question."
+    image_url = match.group(0)
     headers = {
+        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/114.0.0.0 Safari/537.36"
     }
+    try:
+        response = requests.get(image_url, headers=headers)
+        response.raise_for_status()
+        image = Image.open(BytesIO(response.content)).convert("RGB")
+    except Exception as e:
+        return f"Error fetching image: {e}"
     model = LiteLLMModel(
         model_id="gemini/gemini-2.0-flash",
+        api_key=os.environ.get("GEMINI_KEY"),
         max_tokens=8192
     )
     )
     response = agent.run(
+        "Describe in details the chess position you see in the image.",
+        images=[image]
     )
     return f"The image description: '{response}'"