M17idd committed on
Commit
a0f7add
·
verified ·
1 Parent(s): c0d763b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -9
app.py CHANGED
@@ -82,21 +82,23 @@ class TogetherEmbeddings(Embeddings):
82
  @st.cache_resource
83
  def get_pdf_index():
84
  with st.spinner('📄 در حال پردازش فایل PDF...'):
85
- loader = PyPDFLoader('test1.pdf')
86
- documents = loader.load()
 
 
 
87
 
88
- text_splitter = RecursiveCharacterTextSplitter(chunk_size=300, chunk_overlap=0)
89
- texts = text_splitter.split_documents(documents)
90
 
91
- embeddings = HuggingFaceEmbeddings(
92
- model_name="HooshvareLab/bert-fa-zwnj-base"
93
- )
94
 
95
- index = FAISS.from_documents(texts, embeddings)
96
- return index
 
 
 
97
 
98
  index = get_pdf_index()
99
 
 
100
  llm = HuggingFaceHub(
101
  repo_id="HooshvareLab/bert-fa-zwnj-base",
102
  model_kwargs={"temperature": 0.7, "max_new_tokens": 512}
 
82
  @st.cache_resource
83
  def get_pdf_index():
84
  with st.spinner('📄 در حال پردازش فایل PDF...'):
85
+ loader = [PyPDFLoader('test1.pdf')]
86
+ embeddings = TogetherEmbeddings(
87
+ model_name="togethercomputer/m2-bert-80M-8k-retrieval",
88
+ api_key="0291f33aee03412a47fa5d8e562e515182dcc5d9aac5a7fb5eefdd1759005979"
89
+
90
 
 
 
91
 
 
 
 
92
 
93
+ )
94
+ return VectorstoreIndexCreator(
95
+ embedding=embeddings,
96
+ text_splitter=RecursiveCharacterTextSplitter(chunk_size=300, chunk_overlap=0)
97
+ ).from_loaders(loader)
98
 
99
  index = get_pdf_index()
100
 
101
+
102
  llm = HuggingFaceHub(
103
  repo_id="HooshvareLab/bert-fa-zwnj-base",
104
  model_kwargs={"temperature": 0.7, "max_new_tokens": 512}