M17idd committed on
Commit
1d4b774
·
verified ·
1 Parent(s): bc3930f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +15 -12
app.py CHANGED
@@ -81,22 +81,25 @@ class TogetherEmbeddings(Embeddings):
81
  @st.cache_resource
82
  def get_pdf_index():
83
  with st.spinner('📄 در حال پردازش فایل PDF...'):
84
- loader = [PyPDFLoader('test1.pdf')]
85
- embeddings = TogetherEmbeddings(
86
- model_name="togethercomputer/m2-bert-80M-8k-retrieval",
87
- api_key="0291f33aee03412a47fa5d8e562e515182dcc5d9aac5a7fb5eefdd1759005979"
 
 
 
 
88
  )
89
- return VectorstoreIndexCreator(
90
- embedding=embeddings,
91
- text_splitter=RecursiveCharacterTextSplitter(chunk_size=300, chunk_overlap=0)
92
- ).from_loaders(loader)
93
 
94
  index = get_pdf_index()
95
 
96
- llm = ChatOpenAI(
97
- base_url="https://api.together.xyz/v1",
98
- api_key='0291f33aee03412a47fa5d8e562e515182dcc5d9aac5a7fb5eefdd1759005979',
99
- model="meta-llama/Llama-3.3-70B-Instruct-Turbo-Free"
100
  )
101
 
102
  chain = RetrievalQA.from_chain_type(
 
81
  @st.cache_resource
82
  def get_pdf_index():
83
  with st.spinner('📄 در حال پردازش فایل PDF...'):
84
+ loader = PyPDFLoader('test1.pdf')
85
+ documents = loader.load()
86
+
87
+ text_splitter = RecursiveCharacterTextSplitter(chunk_size=300, chunk_overlap=0)
88
+ texts = text_splitter.split_documents(documents)
89
+
90
+ embeddings = HuggingFaceEmbeddings(
91
+ model_name="sentence-transformers/all-MiniLM-L6-v2"
92
  )
93
+
94
+ index = FAISS.from_documents(texts, embeddings)
95
+ return index
 
96
 
97
  index = get_pdf_index()
98
 
99
+ llm = HuggingFaceHub(
100
+ repo_id="HuggingFaceH4/zephyr-7b-alpha", # یا مدل دلخواهت مثل llama یا mistral
101
+ model_kwargs={"temperature": 0.7, "max_new_tokens": 512},
102
+ huggingfacehub_api_token="توکن شما"
103
  )
104
 
105
  chain = RetrievalQA.from_chain_type(