Spaces:

pradeepsengarr
/

Bot_RAG

Sleeping

pradeepsengarr committed on Apr 15

Commit

5256379

verified ·

1 Parent(s): 4977945

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -468,11 +468,29 @@ def split_text_into_chunks(text):
     splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
     return splitter.create_documents([text])
 # --- Create Vector DB ---
 def create_vectorstore(documents):
     model = SentenceTransformer("all-MiniLM-L6-v2", device='cpu')
     embeddings = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
-    db = Chroma.from_documents(documents, embeddings, persist_directory=persist_directory)
     db.persist()
     return db

     splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
     return splitter.create_documents([text])
+import os
+import tempfile
+import shutil
+from langchain.vectorstores import Chroma
+from langchain.embeddings import HuggingFaceEmbeddings
+from sentence_transformers import SentenceTransformer
 # --- Create Vector DB ---
 def create_vectorstore(documents):
+    # Setup a writable directory for Chroma
+    chroma_dir = os.path.join(tempfile.gettempdir(), "chroma_db")
+    if os.path.exists(chroma_dir):
+        shutil.rmtree(chroma_dir)  # Clear any old data
+    os.makedirs(chroma_dir, exist_ok=True)
+    # Initialize the model and embeddings
     model = SentenceTransformer("all-MiniLM-L6-v2", device='cpu')
     embeddings = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
+    # Create the Chroma database
+    db = Chroma.from_documents(documents, embeddings, persist_directory=chroma_dir)
+    # Persist the Chroma database
     db.persist()
     return db