Final_Assignment_Project

Runtime error

wt002 committed 8 days ago

Commit

1e33f11

verified ·

1 Parent(s): 3102ee4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ import requests
 from typing import List, Dict, Union
 import pandas as pd
 import wikipediaapi
-import PyPDF
 from docx import Document
 load_dotenv()
@@ -72,26 +72,24 @@ class BasicAgent:
         page = self.wiki.page(query)
         return page.summary if page.exists() else "No Wikipedia page found"
-    def process_document(self, file_path: str) -> str:
-        """Extract text from PDF (works with PyPDF2 or pypdf)"""
-        if not os.path.exists(file_path):
-            return "File not found"
-        if file_path.lower().endswith('.pdf'):
             try:
-                # Try modern pypdf first
-                from pypdf import PdfReader
-            except ImportError:
-                # Fallback to PyPDF2
                 from PyPDF2 import PdfReader
-            try:
-                with open(file_path, 'rb') as f:
-                    reader = PdfReader(f)
-                    text = "\n".join([page.extract_text() for page in reader.pages])
-                    return text if text.strip() else "PDF has no extractable text"
-            except Exception as e:
-                return f"PDF processing error: {str(e)}"
     def __call__(self, query: str) -> str:

 from typing import List, Dict, Union
 import pandas as pd
 import wikipediaapi
+from pypdf import PdfReader
 from docx import Document
 load_dotenv()
         page = self.wiki.page(query)
         return page.summary if page.exists() else "No Wikipedia page found"
+    def extract_pdf_text(file_path: str) -> str:
+        """Works with both pypdf and PyPDF2."""
+        try:
+            # Prefer 'pypdf' (newer)
+            from pypdf import PdfReader
+        except ImportError:
             try:
+                # Fallback to 'PyPDF2'
                 from PyPDF2 import PdfReader
+            except ImportError:
+                return "Error: Install 'pypdf' or 'PyPDF2' first (pip install pypdf)."
+        try:
+            with open(file_path, 'rb') as f:
+                reader = PdfReader(f)
+                return "\n".join(page.extract_text() for page in reader.pages)
+        except Exception as e:
+            return f"Failed to read PDF: {str(e)}"
     def __call__(self, query: str) -> str: