Makima57 committed on
Commit
084f54d
·
verified ·
1 Parent(s): eea466c

Upload app.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. app.py +10 -6
app.py CHANGED
@@ -1,3 +1,5 @@
 
 
1
  import streamlit as st
2
  from googlesearch import search
3
  import requests
@@ -6,7 +8,7 @@ from bs4 import BeautifulSoup
6
  # Function to perform Google search and return the first link
7
  def google_search(query):
8
  try:
9
- query = query + "/t site:https://www.realtor.ca/"
10
  # Perform the search and get an iterator of results
11
  search_results = search(query, num_results=10) # Get up to 10 results
12
  first_link = next(search_results, None) # Get the first result
@@ -39,7 +41,8 @@ def scrape_text(webpage_content):
39
  # Break multi-headlines into a line each
40
  chunks = (phrase.strip() for line in lines for phrase in line.split(" "))
41
  # Drop blank lines
42
- text = '\n'.join(chunk for chunk in chunks if chunk)
 
43
  return text
44
  except Exception as e:
45
  st.error(f"Failed to scrape text from webpage content: {e}")
@@ -67,11 +70,12 @@ if st.button("Search"):
67
  # Download button for the webpage content
68
  st.download_button(
69
  label="Download Webpage Content",
70
- data=webpage_content,
71
- file_name="webpage_content.html",
72
- mime="text/html"
73
  )
74
  else:
75
  st.warning("No results found")
76
  else:
77
- st.error("Please enter a query")
 
 
1
+
2
+ # app.py
3
  import streamlit as st
4
  from googlesearch import search
5
  import requests
 
8
  # Function to perform Google search and return the first link
9
  def google_search(query):
10
  try:
11
+ query = query + "/t site:https://medium.com/"
12
  # Perform the search and get an iterator of results
13
  search_results = search(query, num_results=10) # Get up to 10 results
14
  first_link = next(search_results, None) # Get the first result
 
41
  # Break multi-headlines into a line each
42
  chunks = (phrase.strip() for line in lines for phrase in line.split(" "))
43
  # Drop blank lines
44
+ text = '\n'.join(chunk for chunk in chunks if chunk)
45
46
  return text
47
  except Exception as e:
48
  st.error(f"Failed to scrape text from webpage content: {e}")
 
70
  # Download button for the webpage content
71
  st.download_button(
72
  label="Download Webpage Content",
73
+ data=scraped_text,
74
+ file_name="webpage_content.txt",
75
+ mime="text/plain"
76
  )
77
  else:
78
  st.warning("No results found")
79
  else:
80
+ st.error("Please enter a query")
81
+