DrishtiSharma committed on
Commit
819c213
·
verified ·
1 Parent(s): 57c61b4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -1
app.py CHANGED
@@ -61,7 +61,16 @@ def load_docs(document_path):
61
  )
62
  documents = loader.load()
63
  text_splitter = NLTKTextSplitter(chunk_size=1000)
64
- return text_splitter.split_documents(documents)
 
 
 
 
 
 
 
 
 
65
  except Exception as e:
66
  st.error(f"Failed to load and process PDF: {e}")
67
  st.stop()
 
61
  )
62
  documents = loader.load()
63
  text_splitter = NLTKTextSplitter(chunk_size=1000)
64
+ split_docs = text_splitter.split_documents(documents)
65
+
66
+ # Filter metadata to only include str, int, float, or bool
67
+ for doc in split_docs:
68
+ if hasattr(doc, "metadata") and isinstance(doc.metadata, dict):
69
+ doc.metadata = {
70
+ k: v for k, v in doc.metadata.items()
71
+ if isinstance(v, (str, int, float, bool))
72
+ }
73
+ return split_docs
74
  except Exception as e:
75
  st.error(f"Failed to load and process PDF: {e}")
76
  st.stop()