Ferocious0xide committed
Commit daaf1a3 · verified · 1 Parent(s): df2f655

Update tools/arxiv_tool.py

Files changed (1)
  1. tools/arxiv_tool.py +62 -38
tools/arxiv_tool.py CHANGED
@@ -13,10 +13,10 @@ class ArxivSearchTool(Tool):
         'query': {'type': 'string', 'description': 'The search query for papers'},
         'max_results': {'type': 'integer', 'description': 'Maximum number of results to return'}
     }
-    output_type = List[Dict]
+    output_type = "string"
 
     def forward(self, query: str = "artificial intelligence",
-                max_results: int = 50) -> List[Dict]:
+                max_results: int = 50) -> str:
         try:
             # Construct the API URL
             base_url = 'http://export.arxiv.org/api/query?'
@@ -40,48 +40,72 @@ class ArxivSearchTool(Tool):
             ns = {'atom': 'http://www.w3.org/2005/Atom',
                   'arxiv': 'http://arxiv.org/schemas/atom'}
 
-            results = []
+            # Format results as a string
+            formatted_results = "## ArXiv Search Results\n\n"
+
             for entry in root.findall('atom:entry', ns):
-                # Extract paper details
-                result = {
-                    'title': entry.find('atom:title', ns).text.strip(),
-                    'authors': [author.find('atom:name', ns).text
-                                for author in entry.findall('atom:author', ns)],
-                    'summary': entry.find('atom:summary', ns).text.strip() if entry.find('atom:summary', ns) is not None else '',
-                    'published': entry.find('atom:published', ns).text.strip(),
-                    'id': entry.find('atom:id', ns).text.strip(),
-                    'pdf_url': next((link.get('href') for link in entry.findall('atom:link', ns)
-                                     if link.get('type') == 'application/pdf'), None),
-                    'categories': [cat.get('term') for cat in entry.findall('atom:category', ns)]
-                }
-                results.append(result)
+                title = entry.find('atom:title', ns).text.strip()
+                authors = [author.find('atom:name', ns).text
+                           for author in entry.findall('atom:author', ns)]
+                summary = entry.find('atom:summary', ns).text.strip() if entry.find('atom:summary', ns) is not None else ''
+                published = entry.find('atom:published', ns).text.strip()
+                paper_id = entry.find('atom:id', ns).text.strip()
+                pdf_url = next((link.get('href') for link in entry.findall('atom:link', ns)
+                                if link.get('type') == 'application/pdf'), None)
+                categories = [cat.get('term') for cat in entry.findall('atom:category', ns)]
+
+                formatted_results += f"### {title}\n"
+                formatted_results += f"- Authors: {', '.join(authors)}\n"
+                formatted_results += f"- Published: {published}\n"
+                formatted_results += f"- Categories: {', '.join(categories)}\n"
+                formatted_results += f"- PDF: {pdf_url}\n"
+                formatted_results += f"- Summary: {summary}\n\n"
+
+            return formatted_results
 
-            return results
         except Exception as e:
-            return [{"error": f"Error searching ArXiv: {str(e)}"}]
+            return f"Error searching ArXiv: {str(e)}"
 
 class LatestPapersTool(Tool):
     name = "get_latest_papers"
     description = "Get papers from the last N days from saved results"
     inputs = {'days_back': {'type': 'integer', 'description': 'Number of days to look back'}}
-    output_type = List[Dict]
+    output_type = "string"
 
-    def forward(self, days_back: int = 1) -> List[Dict]:
-        papers = []
-        base_dir = "daily_papers"
-
-        # Get dates to check
-        dates = [
-            (datetime.now() - timedelta(days=i)).strftime("%Y-%m-%d")
-            for i in range(days_back)
-        ]
-
-        # Load papers for each date
-        for date in dates:
-            file_path = os.path.join(base_dir, f"ai_papers_{date}.json")
-            if os.path.exists(file_path):
-                with open(file_path, 'r', encoding='utf-8') as f:
-                    day_papers = json.load(f)
-                papers.extend(day_papers)
-
-        return papers
+    def forward(self, days_back: int = 1) -> str:
+        try:
+            papers = []
+            base_dir = "daily_papers"
+
+            # Get dates to check
+            dates = [
+                (datetime.now() - timedelta(days=i)).strftime("%Y-%m-%d")
+                for i in range(days_back)
+            ]
+
+            # Load papers for each date
+            for date in dates:
+                file_path = os.path.join(base_dir, f"ai_papers_{date}.json")
+                if os.path.exists(file_path):
+                    with open(file_path, 'r', encoding='utf-8') as f:
+                        day_papers = json.load(f)
+                    papers.extend(day_papers)
+
+            # Format results as a string
+            formatted_results = f"## Latest Papers (Past {days_back} days)\n\n"
+
+            for paper in papers:
+                formatted_results += f"### {paper.get('title', 'Untitled')}\n"
+                formatted_results += f"- Authors: {', '.join(paper.get('authors', ['Unknown']))}\n"
+                formatted_results += f"- Published: {paper.get('published', 'Unknown')}\n"
+                formatted_results += f"- Categories: {', '.join(paper.get('categories', []))}\n"
+                if paper.get('pdf_url'):
+                    formatted_results += f"- PDF: {paper['pdf_url']}\n"
+                if paper.get('summary'):
+                    formatted_results += f"- Summary: {paper['summary']}\n"
+                formatted_results += "\n"
+
+            return formatted_results if papers else f"No papers found in the last {days_back} days."
+
+        except Exception as e:
+            return f"Error getting latest papers: {str(e)}"