Update app.py
Browse files
app.py
CHANGED
@@ -6,8 +6,8 @@ print(dataset)
|
|
6 |
|
7 |
from langchain.text_splitter import RecursiveCharacterTextSplitter
|
8 |
splitter = RecursiveCharacterTextSplitter(chunk_size=100, chunk_overlap=15,separators=["\n\n", "\n", " ", ""])
|
9 |
-
docs = splitter.split_documents(dataset)
|
10 |
-
|
11 |
|
12 |
|
13 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
@@ -18,7 +18,7 @@ embedding_model = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
|
|
18 |
from langchain_community.vectorstores import Chroma
|
19 |
persist_directory = 'docs/chroma/'
|
20 |
vectordb = Chroma.from_documents(
|
21 |
-
documents=docs,
|
22 |
embedding=embedding_model,
|
23 |
persist_directory=persist_directory
|
24 |
)
|
|
|
6 |
|
7 |
from langchain.text_splitter import RecursiveCharacterTextSplitter
|
8 |
# Chunker configuration: chunks of at most 100 units (characters under the
# library's default length function) with a 15-unit overlap between
# neighbours. The separators are listed from coarsest (blank line) to finest
# (empty string, i.e. split anywhere).
splitter = RecursiveCharacterTextSplitter(
    chunk_size=100,
    chunk_overlap=15,
    separators=["\n\n", "\n", " ", ""],
)
|
9 |
+
#docs = splitter.split_documents(dataset)
|
10 |
+
# split_text() takes one string and returns a list of string chunks, not
# Document objects, so downstream code must treat `docs` as list[str].
# NOTE(review): str(dataset) is the object's string representation. If
# `dataset` is a Hugging Face Dataset/DatasetDict, that is presumably its
# summary repr (features, num_rows) rather than the row text -- confirm this
# is the intended input before relying on the resulting chunks.
docs = splitter.split_text(str(dataset))
|
11 |
|
12 |
|
13 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
|
|
18 |
from langchain_community.vectorstores import Chroma
|
19 |
# Directory passed to Chroma as its on-disk persistence location.
persist_directory = 'docs/chroma/'
# `docs` is produced by `splitter.split_text(...)`, i.e. a flat list of plain
# strings, so the store is built with `from_texts`. The previous call used
# `from_documents(documents=[docs])`: that API expects a list of Document
# objects and reads `.page_content` from each element, so handing it a list
# that wraps the list of strings fails instead of indexing the chunks.
vectordb = Chroma.from_texts(
    texts=docs,
    embedding=embedding_model,
    persist_directory=persist_directory,
)
|