File size: 4,560 Bytes
09ebcd0 eec4d01 efb5f18 09ebcd0 6097fb2 1b298f9 34db24b 6097fb2 1b298f9 8415ea5 6097fb2 2efa0ec eec4d01 8415ea5 eec4d01 1b298f9 6097fb2 eec4d01 6097fb2 ba53ac8 6097fb2 ba53ac8 1b298f9 a31c3ed 8415ea5 d0b4b99 8415ea5 482bc99 6097fb2 d0b4b99 a4f4206 ba53ac8 8415ea5 ba53ac8 d0b4b99 c5cb552 d0b4b99 482bc99 d0b4b99 ba53ac8 d0b4b99 efb5f18 d0b4b99 158b524 8415ea5 d0b4b99 68a8b0c 43da967 ba53ac8 6097fb2 ab30506 6097fb2 43da967 ad0f104 d0b4b99 43da967 d0b4b99 43da967 ad0f104 43da967 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 |
import gradio as gr
import requests
import json
from datetime import datetime, timedelta
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6"
MAJOR_COUNTRIES = [
"United States", "United Kingdom", "Canada", "Australia", "Germany",
"France", "Japan", "South Korea", "China", "India",
"Brazil", "Mexico", "Russia", "Italy", "Spain",
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark",
"Finland", "Belgium", "Austria", "New Zealand", "Ireland",
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia",
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic",
"Hungary", "Greece", "Portugal", "Argentina", "Chile",
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia",
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh"
]
def search_serphouse(query, country, page, num_result):
url = "https://api.serphouse.com/serp/live"
payload = {
"data": {
"q": query,
"domain": "google.com",
"loc": country,
"lang": "en",
"device": "desktop",
"serp_type": "news",
"page": str(page),
"verbatim": "1",
"num": str(num_result)
}
}
headers = {
"accept": "application/json",
"content-type": "application/json",
"authorization": f"Bearer {API_KEY}"
}
try:
response = requests.post(url, json=payload, headers=headers)
response.raise_for_status()
return response.json()
except requests.RequestException as e:
return f"Error: {str(e)}"
def is_recent_news(time_str):
if not time_str:
return False
time_parts = time_str.lower().split()
if len(time_parts) < 2:
return False
try:
value = int(time_parts[0])
unit = time_parts[1]
if unit in ['minute', 'minutes', 'hour', 'hours']:
return True
elif unit == 'day':
return value < 1
except ValueError:
return False
return False
def format_results(results):
all_results = "## All News Results\n\n"
recent_results = "## Recent News Results (Within 1 Day)\n\n"
try:
if isinstance(results, dict) and "results" in results and "news" in results["results"]:
news_results = results["results"]["news"]
for result in news_results:
all_results += f"""
### [{result.get('title', 'No Title')}]({result.get('url', '#')})
{result.get('snippet', 'No Snippet')}
**Source:** {result.get('channel', 'Unknown')} - {result.get('time', 'Unknown time')}
---
"""
if is_recent_news(result.get("time", "")):
recent_results += f"""
### [{result.get('title', 'No Title')}]({result.get('url', '#')})
{result.get('snippet', 'No Snippet')}
**Source:** {result.get('channel', 'Unknown')} - {result.get('time', 'Unknown time')}
---
"""
if recent_results == "## Recent News Results (Within 1 Day)\n\n":
recent_results += "*No recent news results found within 1 day.*\n\n"
else:
all_results += "*No valid news results found in the API response.*\n\n"
recent_results += "*No valid news results found in the API response.*\n\n"
except Exception as e:
all_results += f"*Error processing results: {str(e)}*\n\n"
recent_results += f"*Error processing results: {str(e)}*\n\n"
return all_results, recent_results
def serphouse_search(query, country, page, num_result):
results = search_serphouse(query, country, page, num_result)
all_results, recent_results = format_results(results)
return f"Raw Results:\n\n```json\n{json.dumps(results, indent=2)}\n```\n\n{all_results}", recent_results
css = """
footer {
visibility: hidden;
}
"""
iface = gr.Interface(
fn=serphouse_search,
inputs=[
gr.Textbox(label="Search Query"),
gr.Dropdown(MAJOR_COUNTRIES, label="Country"),
gr.Slider(1, 10, 1, label="Page"),
gr.Slider(1, 100, 10, label="Number of Results")
],
outputs=[
gr.Textbox(label="All Results", lines=20),
gr.Markdown(label="Recent Results (Within 1 Day)")
],
title="SERPHouse News Search Interface",
description="Enter your search query and select a country to get news results from the SERPHouse API. Recent results (within 1 day) are shown separately.",
theme="Nymbo/Nymbo_Theme",
css=css
)
iface.launch() |