Spaces:

zliang
/

PDFReadingAssistant

Paused

App Files Files Community

zliang committed on Feb 10

Commit

a2d9aa7

verified ·

1 Parent(s): 8eab150

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -7

app.py CHANGED Viewed

@@ -98,17 +98,13 @@ def summarize_pdf_with_tooltips(_pdf_file_path, num_clusters=10):
 2. Main methodologies used
 3. Important data points
 4. Limitations mentioned
 For any information directly derived from the context excerpts provided below, insert an in-text citation as an HTML tooltip.
 For each citation, use the following HTML format:
 <span class="tooltip" data-tooltip="{full_text}">[{n}]</span>
 Where:
 - {n} is the citation number.
 - {full_text} is the complete excerpt text for that citation.
 Do not provide a separate reference list. Instead, embed the full citation text directly in the tooltip.
 Context Excerpts:
 {contexts}"""
     )
@@ -150,7 +146,7 @@ Context Excerpts:
 @handle_errors
 def qa_pdf(_pdf_file_path, query, num_clusters=5):
     embeddings_model = OpenAIEmbeddings(model="text-embedding-3-small", api_key=openai_api_key)
-    llm = ChatOpenAI(model="gpt-3.5-turbo", api_key=openai_api_key, temperature=0.3)
     prompt = ChatPromptTemplate.from_template(
         """Answer this question: {question}
@@ -190,7 +186,7 @@ def process_pdf(_pdf_file_path):
     scale_factor = 300 / 50  # High-res to low-res ratio
     for page in doc:
-        low_res = page.get_pixmap(dpi=300)
         low_res_img = np.frombuffer(low_res.samples, dtype=np.uint8).reshape(low_res.height, low_res.width, 3)
         results = model.predict(low_res_img)
@@ -378,4 +374,4 @@ st.markdown("""
       width: 300px; /* Adjust width as needed */
     }
 </style>
-""", unsafe_allow_html=True)

 2. Main methodologies used
 3. Important data points
 4. Limitations mentioned
 For any information directly derived from the context excerpts provided below, insert an in-text citation as an HTML tooltip.
 For each citation, use the following HTML format:
 <span class="tooltip" data-tooltip="{full_text}">[{n}]</span>
 Where:
 - {n} is the citation number.
 - {full_text} is the complete excerpt text for that citation.
 Do not provide a separate reference list. Instead, embed the full citation text directly in the tooltip.
 Context Excerpts:
 {contexts}"""
     )
 @handle_errors
 def qa_pdf(_pdf_file_path, query, num_clusters=5):
     embeddings_model = OpenAIEmbeddings(model="text-embedding-3-small", api_key=openai_api_key)
+    llm = ChatOpenAI(model="gpt-4", api_key=openai_api_key, temperature=0.3)
     prompt = ChatPromptTemplate.from_template(
         """Answer this question: {question}
     scale_factor = 300 / 50  # High-res to low-res ratio
     for page in doc:
+        low_res = page.get_pixmap(dpi=50)
         low_res_img = np.frombuffer(low_res.samples, dtype=np.uint8).reshape(low_res.height, low_res.width, 3)
         results = model.predict(low_res_img)
       width: 300px; /* Adjust width as needed */
     }
 </style>
+""", unsafe_allow_html=True)