|
import json
import os
from datetime import datetime, timedelta

import gradio as gr
import requests
|
|
|
# SERPHouse API token, sent as the Bearer credential on every request.
# The SERPHOUSE_API_KEY environment variable takes precedence; the literal is
# kept only as a backward-compatible fallback for existing deployments.
# SECURITY: a key committed to source control should be treated as leaked.
# Rotate it and drop the fallback once deployments set the variable.
API_KEY = (
    os.environ.get("SERPHOUSE_API_KEY")
    or "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6"
)
|
|
|
# Country names offered in the "Country" dropdown; the selected entry is
# forwarded to the API as the search location.
MAJOR_COUNTRIES = [
    "United States",
    "United Kingdom",
    "Canada",
    "Australia",
    "Germany",
    "France",
    "Japan",
    "South Korea",
    "China",
    "India",
    "Brazil",
    "Mexico",
    "Russia",
    "Italy",
    "Spain",
    "Netherlands",
    "Sweden",
    "Switzerland",
    "Norway",
    "Denmark",
    "Finland",
    "Belgium",
    "Austria",
    "New Zealand",
    "Ireland",
    "Singapore",
    "Hong Kong",
    "Israel",
    "United Arab Emirates",
    "Saudi Arabia",
    "South Africa",
    "Turkey",
    "Egypt",
    "Poland",
    "Czech Republic",
    "Hungary",
    "Greece",
    "Portugal",
    "Argentina",
    "Chile",
    "Colombia",
    "Peru",
    "Venezuela",
    "Thailand",
    "Malaysia",
    "Indonesia",
    "Philippines",
    "Vietnam",
    "Pakistan",
    "Bangladesh",
]
|
|
|
def _as_int_text(value):
    """Return ``value`` as an integer string, or ``str(value)`` if it is not numeric."""
    try:
        return str(int(value))
    except (TypeError, ValueError, OverflowError):
        return str(value)


def search_serphouse(query, country, page, num_result, *, timeout=30):
    """Request Google News results from the SERPHouse live SERP endpoint.

    Args:
        query: Search phrase, sent as ``q``.
        country: Location string, sent as ``loc``.
        page: Result page number, sent as ``page``. Numeric values are
            truncated to an integer before being sent, so a fractional UI
            value such as ``3.0`` becomes ``"3"``.
        num_result: Number of results to request, sent as ``num`` with the
            same integer normalisation as ``page``.
        timeout: Seconds to wait for the server before giving up. Without a
            timeout a stalled connection would block the caller forever.

    Returns:
        The decoded JSON body on success. On any request failure (network
        error, timeout, non-2xx status, undecodable body) a string of the
        form ``"Error: <details>"`` is returned instead of raising.
    """
    url = "https://api.serphouse.com/serp/live"

    payload = {
        "data": {
            "q": query,
            "domain": "google.com",
            "loc": country,
            "lang": "en",
            "device": "desktop",
            "serp_type": "news",
            "page": _as_int_text(page),
            "verbatim": "1",
            "num": _as_int_text(num_result),
        }
    }

    headers = {
        "accept": "application/json",
        "content-type": "application/json",
        "authorization": f"Bearer {API_KEY}",
    }

    try:
        response = requests.post(
            url, json=payload, headers=headers, timeout=timeout
        )
        response.raise_for_status()
        return response.json()
    # ValueError covers JSON decoding failures on requests versions whose
    # decode error is not a RequestException subclass.
    except (requests.RequestException, ValueError) as e:
        return f"Error: {e}"
|
|
|
# Maps each recognised unit word to the matching ``timedelta`` keyword.
_RELATIVE_TIME_UNITS = {
    "second": "seconds",
    "seconds": "seconds",
    "sec": "seconds",
    "secs": "seconds",
    "minute": "minutes",
    "minutes": "minutes",
    "min": "minutes",
    "mins": "minutes",
    "hour": "hours",
    "hours": "hours",
    "hr": "hours",
    "hrs": "hours",
    "day": "days",
    "days": "days",
}


def is_recent_news(time_str):
    """Tell whether a relative timestamp describes an age of at most one day.

    The text is expected to start with an amount and a unit, e.g.
    ``"3 hours ago"`` or ``"1 day ago"``; anything after the first two words
    is ignored. ``"a"`` / ``"an"`` are accepted as an amount of one.

    Args:
        time_str: Relative time text. Non-string or empty values are treated
            as not recent.

    Returns:
        ``True`` when the amount and unit add up to between zero and 24 hours
        inclusive; ``False`` for larger ages, unknown units (weeks, months,
        ...), or text that cannot be parsed.
    """
    if not isinstance(time_str, str):
        return False

    parts = time_str.lower().split()
    if len(parts) < 2:
        return False

    amount_text, unit = parts[0], parts[1]
    unit_keyword = _RELATIVE_TIME_UNITS.get(unit)
    if unit_keyword is None:
        return False

    if amount_text in ("a", "an"):
        amount = 1
    else:
        try:
            amount = int(amount_text)
        except ValueError:
            return False

    try:
        age = timedelta(**{unit_keyword: amount})
    except OverflowError:
        # Absurdly large amounts cannot be represented, and are not recent.
        return False

    # Compare the real duration so that e.g. "30 hours ago" is not reported
    # as being within one day.
    return timedelta(0) <= age <= timedelta(days=1)
|
|
|
def _extract_news_list(results):
    """Return the ``results -> news`` list, raising ``ValueError`` if it is absent."""
    if not isinstance(results, dict):
        if isinstance(results, str):
            # A string here is the upstream error text; surface it instead
            # of hiding it behind a generic message.
            raise ValueError(f"Results is not a dictionary: {results}")
        raise ValueError("Results is not a dictionary")

    if "results" not in results:
        raise ValueError("No 'results' key in the response")

    payload = results["results"]
    if not isinstance(payload, dict) or "news" not in payload:
        raise ValueError("No 'news' key in results")

    news_results = payload["news"]
    if not isinstance(news_results, (list, tuple)):
        raise ValueError("'news' is not a list")
    return news_results


def format_results(results):
    """Render a news search response as three Markdown documents.

    Args:
        results: Either the decoded API response (a dict holding a list of
            article dicts under ``results -> news``) or an error string.

    Returns:
        A ``(all_results, recent_results, debug_info)`` tuple of Markdown
        strings: every article, only the articles that ``is_recent_news``
        accepts, and a debug report containing the raw response plus the
        per-article recency decision. If the response cannot be processed,
        the first two elements carry the error message instead. This function
        does not raise.
    """
    try:
        # ensure_ascii=False keeps non-English text readable in the dump.
        raw_dump = json.dumps(results, indent=2, ensure_ascii=False)
    except (TypeError, ValueError):
        # Not JSON-serialisable: fall back so the debug report still renders.
        raw_dump = repr(results)

    debug_parts = [
        "## Debug Information\n\n",
        f"Raw API Response:\n```json\n{raw_dump}\n```\n\n",
    ]
    all_parts = []
    recent_parts = []

    try:
        news_results = _extract_news_list(results)
        debug_parts.append(f"Number of news results: {len(news_results)}\n\n")

        for result in news_results:
            if not isinstance(result, dict):
                # One malformed entry must not discard the usable articles.
                debug_parts.append(
                    f"Skipped malformed article entry: {result!r}\n\n"
                )
                continue

            # "or" also replaces null/empty values, not just missing keys.
            title = result.get("title") or "No Title"
            url = result.get("url") or "#"
            snippet = result.get("snippet") or "No Snippet"
            channel = result.get("channel") or "Unknown"
            time_str = result.get("time") or "Unknown time"

            is_recent = is_recent_news(time_str)
            debug_parts.append(
                f"Article: {title}\nTime: {time_str}, Is Recent: {is_recent}\n\n"
            )

            article_info = (
                f"\n### [{title}]({url})\n\n"
                f"{snippet}\n\n"
                f"**Source:** {channel} - {time_str}\n\n"
                "---\n\n"
            )
            all_parts.append(article_info)
            if is_recent:
                recent_parts.append(article_info)

        all_results = "## All News Results\n\n" + "".join(all_parts)
        recent_results = "## Recent News Results (Within 1 Day)\n\n" + (
            "".join(recent_parts)
            or "*No recent news results found within 1 day.*\n\n"
        )
    except Exception as e:
        # UI boundary: report the failure in every pane rather than raising.
        error_message = f"Error processing results: {e}"
        debug_parts.append(error_message + "\n")
        all_results = error_message + "\n\n"
        recent_results = error_message + "\n\n"

    return all_results, recent_results, "".join(debug_parts)
|
|
|
def serphouse_search(query, country, page, num_result):
    """Run one news search and return its Markdown rendering.

    Passes the four arguments to ``search_serphouse`` and hands the response
    to ``format_results``.

    Returns:
        The ``(all_results, recent_results, debug_info)`` tuple produced by
        ``format_results``.
    """
    api_response = search_serphouse(query, country, page, num_result)
    all_markdown, recent_markdown, debug_markdown = format_results(api_response)
    return all_markdown, recent_markdown, debug_markdown
|
|
|
# Custom stylesheet passed to the interface: hides the page footer.
css = """
footer {
    visibility: hidden;
}
"""

# Web UI: four inputs feed serphouse_search, whose three Markdown strings
# fill the three output panes in order.
iface = gr.Interface(
    fn=serphouse_search,
    inputs=[
        gr.Textbox(label="Search Query"),
        gr.Dropdown(MAJOR_COUNTRIES, label="Country"),
        # step=1 keeps both sliders on whole numbers. With no explicit step
        # Gradio picks a fractional one from the range, which makes no sense
        # for a page number or a result count.
        gr.Slider(1, 10, 1, step=1, label="Page"),
        gr.Slider(1, 100, 10, step=1, label="Number of Results"),
    ],
    outputs=[
        gr.Markdown(label="All Results"),
        gr.Markdown(label="Recent Results (Within 1 Day)"),
        gr.Markdown(label="Debug Information"),
    ],
    title="SERPHouse News Search Interface",
    description="Enter your search query and select a country to get news results from the SERPHouse API. Recent results (within 1 day) are shown separately.",
    theme="Nymbo/Nymbo_Theme",
    css=css,
)

# Start the web server; this runs at import time, as in the original script.
iface.launch()
|
|