Update app.py
Browse files
app.py
CHANGED
@@ -61,7 +61,16 @@ def load_docs(document_path):
|
|
61 |
)
|
62 |
documents = loader.load()
|
63 |
text_splitter = NLTKTextSplitter(chunk_size=1000)
|
64 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
65 |
except Exception as e:
|
66 |
st.error(f"Failed to load and process PDF: {e}")
|
67 |
st.stop()
|
|
|
61 |
)
|
62 |
documents = loader.load()
|
63 |
text_splitter = NLTKTextSplitter(chunk_size=1000)
|
64 |
+
split_docs = text_splitter.split_documents(documents)
|
65 |
+
|
66 |
+
# Filter metadata to only include str, int, float, or bool
|
67 |
+
for doc in split_docs:
|
68 |
+
if hasattr(doc, "metadata") and isinstance(doc.metadata, dict):
|
69 |
+
doc.metadata = {
|
70 |
+
k: v for k, v in doc.metadata.items()
|
71 |
+
if isinstance(v, (str, int, float, bool))
|
72 |
+
}
|
73 |
+
return split_docs
|
74 |
except Exception as e:
|
75 |
st.error(f"Failed to load and process PDF: {e}")
|
76 |
st.stop()
|