|
import gradio as gr |
|
import requests |
|
import json |
|
from datetime import datetime, timedelta |
|
|
|
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6" |
|
|
|
MAJOR_COUNTRIES = [ |
|
"United States", "United Kingdom", "Canada", "Australia", "Germany", |
|
"France", "Japan", "South Korea", "China", "India", |
|
"Brazil", "Mexico", "Russia", "Italy", "Spain", |
|
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", |
|
"Finland", "Belgium", "Austria", "New Zealand", "Ireland", |
|
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", |
|
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", |
|
"Hungary", "Greece", "Portugal", "Argentina", "Chile", |
|
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", |
|
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh" |
|
] |
|
|
|
def search_serphouse(query, country, page, num_result): |
|
url = "https://api.serphouse.com/serp/live" |
|
|
|
payload = { |
|
"data": { |
|
"q": query, |
|
"domain": "google.com", |
|
"loc": country, |
|
"lang": "en", |
|
"device": "desktop", |
|
"serp_type": "news", |
|
"page": str(page), |
|
"verbatim": "1", |
|
"num": str(num_result) |
|
} |
|
} |
|
|
|
headers = { |
|
"accept": "application/json", |
|
"content-type": "application/json", |
|
"authorization": f"Bearer {API_KEY}" |
|
} |
|
|
|
try: |
|
response = requests.post(url, json=payload, headers=headers) |
|
response.raise_for_status() |
|
return response.json() |
|
except requests.RequestException as e: |
|
return f"Error: {str(e)}" |
|
|
|
def is_recent_news(time_str): |
|
if not time_str: |
|
return False |
|
time_parts = time_str.lower().split() |
|
if len(time_parts) < 2: |
|
return False |
|
try: |
|
value = int(time_parts[0]) |
|
unit = time_parts[1] |
|
if unit in ['minute', 'minutes', 'hour', 'hours']: |
|
return True |
|
elif unit in ['day', 'days']: |
|
return value <= 1 |
|
except ValueError: |
|
return False |
|
return False |
|
|
|
def format_results(results): |
|
all_results = "## All News Results\n\n" |
|
recent_results = "## Recent News Results (Within 1 Day)\n\n" |
|
debug_info = "## Debug Information\n\n" |
|
|
|
debug_info += f"Raw API Response:\n```json\n{json.dumps(results, indent=2)}\n```\n\n" |
|
|
|
try: |
|
if isinstance(results, dict) and "results" in results and "news" in results["results"]: |
|
news_results = results["results"]["news"] |
|
debug_info += f"Number of news results: {len(news_results)}\n\n" |
|
|
|
for result in news_results: |
|
time_str = result.get("time", "Unknown time") |
|
is_recent = is_recent_news(time_str) |
|
debug_info += f"Article: {result.get('title', 'No Title')}\nTime: {time_str}, Is Recent: {is_recent}\n\n" |
|
|
|
all_results += f""" |
|
### [{result.get('title', 'No Title')}]({result.get('url', '#')}) |
|
|
|
{result.get('snippet', 'No Snippet')} |
|
|
|
**Source:** {result.get('channel', 'Unknown')} - {time_str} |
|
|
|
--- |
|
|
|
""" |
|
if is_recent: |
|
recent_results += f""" |
|
### [{result.get('title', 'No Title')}]({result.get('url', '#')}) |
|
|
|
{result.get('snippet', 'No Snippet')} |
|
|
|
**Source:** {result.get('channel', 'Unknown')} - {time_str} |
|
|
|
--- |
|
|
|
""" |
|
|
|
if recent_results == "## Recent News Results (Within 1 Day)\n\n": |
|
recent_results += "*No recent news results found within 1 day.*\n\n" |
|
else: |
|
all_results += "*No valid news results found in the API response.*\n\n" |
|
recent_results += "*No valid news results found in the API response.*\n\n" |
|
debug_info += "Invalid or unexpected API response structure\n" |
|
except Exception as e: |
|
all_results += f"*Error processing results: {str(e)}*\n\n" |
|
recent_results += f"*Error processing results: {str(e)}*\n\n" |
|
debug_info += f"Exception occurred: {str(e)}\n" |
|
|
|
return all_results, recent_results, debug_info |
|
|
|
def serphouse_search(query, country, page, num_result): |
|
results = search_serphouse(query, country, page, num_result) |
|
all_results, recent_results, debug_info = format_results(results) |
|
return all_results, recent_results, debug_info |
|
|
|
css = """ |
|
footer { |
|
visibility: hidden; |
|
} |
|
""" |
|
|
|
iface = gr.Interface( |
|
fn=serphouse_search, |
|
inputs=[ |
|
gr.Textbox(label="Search Query"), |
|
gr.Dropdown(MAJOR_COUNTRIES, label="Country"), |
|
gr.Slider(1, 10, 1, label="Page"), |
|
gr.Slider(1, 100, 10, label="Number of Results") |
|
], |
|
outputs=[ |
|
gr.Markdown(label="All Results"), |
|
gr.Markdown(label="Recent Results (Within 1 Day)"), |
|
gr.Markdown(label="Debug Information") |
|
], |
|
title="SERPHouse News Search Interface", |
|
description="Enter your search query and select a country to get news results from the SERPHouse API. Recent results (within 1 day) are shown separately.", |
|
theme="Nymbo/Nymbo_Theme", |
|
css=css |
|
) |
|
|
|
iface.launch() |
|
|