CPS-Test-Mobile

Paused

Ali2206 committed on Apr 10

Commit

2737da8

verified ·

1 Parent(s): e69f295

Update ui/ui_core.py

Files changed (1) hide show

ui/ui_core.py CHANGED Viewed

@@ -42,21 +42,24 @@ def extract_all_text_from_csv_or_excel(file_path: str, progress=None, index=0, t
         df = None
         if file_path.endswith(".csv"):
-            df = pd.read_csv(file_path, encoding_errors="replace", dtype=str, header=None)
         elif file_path.endswith((".xls", ".xlsx")):
             try:
-                df = pd.read_excel(file_path, engine="openpyxl", dtype=str, header=None)
             except:
-                df = pd.read_excel(file_path, engine="xlrd", dtype=str, header=None)
         if df is None or df.empty:
             return f"[Warning] No data extracted from: {file_path}"
         lines = []
         for _, row in df.iterrows():
-            line = " | ".join(str(cell) for cell in row if pd.notna(cell))
             if line:
                 lines.append(line)
         return f"\U0001F4C4 {os.path.basename(file_path)}\n\n" + "\n".join(lines)
     except Exception as e:

         df = None
         if file_path.endswith(".csv"):
+            df = pd.read_csv(file_path, encoding_errors="replace", header=None, dtype=str, skip_blank_lines=False, on_bad_lines="skip")
         elif file_path.endswith((".xls", ".xlsx")):
             try:
+                df = pd.read_excel(file_path, engine="openpyxl", header=None, dtype=str)
             except:
+                df = pd.read_excel(file_path, engine="xlrd", header=None, dtype=str)
         if df is None or df.empty:
             return f"[Warning] No data extracted from: {file_path}"
+        df = df.fillna("")  # Handle missing data gracefully
         lines = []
         for _, row in df.iterrows():
+            line = " | ".join(str(cell) for cell in row if str(cell).strip())
             if line:
                 lines.append(line)
         return f"\U0001F4C4 {os.path.basename(file_path)}\n\n" + "\n".join(lines)
     except Exception as e: