Final_Assignment_Project

Runtime error

wt002 committed 8 days ago

Commit

606a4f5

verified ·

1 Parent(s): 499242c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,7 +8,6 @@ import requests
 from typing import List, Dict, Union
 import pandas as pd
 import wikipediaapi
-from pdfminer.high_level import extract_text
 from docx import Document
 load_dotenv()
@@ -74,11 +73,14 @@ class BasicAgent:
     def _process_pdf(self, file_path: str) -> str:
-        """Extract text from PDF using pdfminer.six (no PyPDF2/pypdf needed)."""
         try:
-            return extract_text(file_path)
         except Exception as e:
-            return f"PDF processing error: {str(e)}"
     def __call__(self, query: str) -> str:

 from typing import List, Dict, Union
 import pandas as pd
 import wikipediaapi
 from docx import Document
 load_dotenv()
     def _process_pdf(self, file_path: str) -> str:
+        """Fallback PDF text extraction (works for simple PDFs)."""
         try:
+            # Read raw binary data and decode text (very basic)
+            with open(file_path, 'rb') as f:
+                text = f.read().decode('latin-1')  # Try UTF-8 if this fails
+                return text if text.strip() else "PDF text not extractable (install pdfminer.six for better results)"
         except Exception as e:
+            return f"PDF read error: {str(e)}"
     def __call__(self, query: str) -> str: