|
import gradio as gr |
|
import requests |
|
import json |
|
from datetime import datetime, timedelta |
|
|
|
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6" |
|
|
|
MAJOR_COUNTRIES = [ |
|
"United States", "United Kingdom", "Canada", "Australia", "Germany", |
|
"France", "Japan", "South Korea", "China", "India", |
|
"Brazil", "Mexico", "Russia", "Italy", "Spain", |
|
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", |
|
"Finland", "Belgium", "Austria", "New Zealand", "Ireland", |
|
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", |
|
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", |
|
"Hungary", "Greece", "Portugal", "Argentina", "Chile", |
|
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", |
|
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh" |
|
] |
|
|
|
def search_serphouse(query, country, page=1, num_result=100): |
|
url = "https://api.serphouse.com/serp/live" |
|
|
|
now = datetime.utcnow() |
|
yesterday = now - timedelta(days=1) |
|
date_range = f"{yesterday.strftime('%Y-%m-%d')},{now.strftime('%Y-%m-%d')}" |
|
|
|
payload = { |
|
"data": { |
|
"q": query, |
|
"domain": "google.com", |
|
"loc": country, |
|
"lang": "en", |
|
"device": "desktop", |
|
"serp_type": "news", |
|
"page": str(page), |
|
"verbatim": "1", |
|
"num": str(num_result), |
|
"date_range": date_range |
|
} |
|
} |
|
|
|
headers = { |
|
"accept": "application/json", |
|
"content-type": "application/json", |
|
"authorization": f"Bearer {API_KEY}" |
|
} |
|
|
|
try: |
|
response = requests.post(url, json=payload, headers=headers) |
|
response.raise_for_status() |
|
return response.json() |
|
except requests.RequestException as e: |
|
error_msg = f"Error: {str(e)}" |
|
if response.text: |
|
error_msg += f"\nResponse content: {response.text}" |
|
return {"error": error_msg} |
|
|
|
def format_results_from_raw(results): |
|
try: |
|
|
|
debug_info = "" |
|
|
|
if isinstance(results, dict) and "error" in results: |
|
return "Error: " + results["error"], "" |
|
|
|
if not isinstance(results, dict): |
|
raise ValueError("๊ฒฐ๊ณผ๊ฐ ์ฌ์ ํ์์ด ์๋๋๋ค.") |
|
|
|
|
|
if 'results' in results: |
|
results_content = results['results'] |
|
if 'results' in results_content: |
|
results_content = results_content['results'] |
|
|
|
if 'news' in results_content: |
|
news_results = results_content['news'] |
|
else: |
|
news_results = [] |
|
else: |
|
news_results = [] |
|
else: |
|
news_results = [] |
|
|
|
if not news_results: |
|
return "๊ฒ์ ๊ฒฐ๊ณผ๊ฐ ์์ต๋๋ค.", "" |
|
|
|
|
|
list_output = "" |
|
|
|
for idx, result in enumerate(news_results, 1): |
|
title = result.get("title", "์ ๋ชฉ ์์") |
|
link = result.get("url", result.get("link", "#")) |
|
snippet = result.get("snippet", "๋ด์ฉ ์์") |
|
channel = result.get("channel", result.get("source", "์ ์ ์์")) |
|
time = result.get("time", result.get("date", "์ ์ ์๋ ์๊ฐ")) |
|
image_url = result.get("img", result.get("thumbnail", "")) |
|
|
|
|
|
if image_url and not image_url.startswith("data:image"): |
|
thumbnail_html = f'<img src="{image_url}" alt="Thumbnail" style="width: 100px; height: auto;">' |
|
else: |
|
thumbnail_html = '' |
|
|
|
|
|
list_item = f""" |
|
<div style="margin-bottom: 20px;"> |
|
<h4>{idx}. <a href="{link}" target="_blank">{title}</a></h4> |
|
<p>{thumbnail_html}</p> |
|
<p>์์ฝ: {snippet}</p> |
|
<p>์ถ์ฒ: {channel} | ์๊ฐ: {time}</p> |
|
<hr> |
|
</div> |
|
""" |
|
list_output += list_item |
|
|
|
return list_output, "" |
|
|
|
except Exception as e: |
|
error_message = f"๊ฒฐ๊ณผ ์ฒ๋ฆฌ ์ค ์ค๋ฅ ๋ฐ์: {str(e)}" |
|
return "Error: " + error_message, "" |
|
|
|
def serphouse_search(query, country): |
|
|
|
page = 1 |
|
num_result = 100 |
|
results = search_serphouse(query, country, page, num_result) |
|
list_output, debug_info = format_results_from_raw(results) |
|
return list_output |
|
|
|
css = """ |
|
footer { |
|
visibility: hidden; |
|
} |
|
/* '๋ด์ค ๊ฒฐ๊ณผ'์ '๋๋ฒ๊ทธ ์ ๋ณด' ํญ ์จ๊ธฐ๊ธฐ */ |
|
#tab-๋ด์ค_๊ฒฐ๊ณผ, #tab-๋๋ฒ๊ทธ_์ ๋ณด { |
|
display: none !important; |
|
} |
|
/* 'ํ์ด์ง'์ '๊ฒฐ๊ณผ ์' ์
๋ ฅ ์์ ์จ๊ธฐ๊ธฐ */ |
|
.slider-container { |
|
display: none !important; |
|
} |
|
""" |
|
|
|
|
|
with gr.Blocks(theme="Nymbo/Nymbo_Theme", css=css, title="NewsAI ์๋น์ค") as iface: |
|
gr.Markdown("๊ฒ์์ด๋ฅผ ์
๋ ฅํ๊ณ ์ํ๋ ๊ตญ๊ฐ๋ฅผ ์ ํํ๋ฉด, ๊ฒ์์ด์ ์ผ์นํ๋ 24์๊ฐ ์ด๋ด ๋ด์ค๋ฅผ ์ต๋ 100๊ฐ ์ถ๋ ฅํฉ๋๋ค.") |
|
|
|
with gr.Tab("๊ฒ์"): |
|
with gr.Row(): |
|
query = gr.Textbox(label="๊ฒ์์ด") |
|
country = gr.Dropdown(MAJOR_COUNTRIES, label="๊ตญ๊ฐ", value="South Korea") |
|
|
|
|
|
|
|
|
|
|
|
search_button = gr.Button("๊ฒ์") |
|
|
|
|
|
|
|
|
|
|
|
with gr.Tab("๋ฆฌ์คํธ"): |
|
list_output = gr.HTML(label="๋ฆฌ์คํธ ๊ฒฐ๊ณผ") |
|
|
|
|
|
|
|
|
|
def search_and_display(query, country): |
|
list_output_text = serphouse_search(query, country) |
|
return {list_output: list_output_text} |
|
|
|
search_button.click( |
|
search_and_display, |
|
inputs=[query, country], |
|
outputs=[list_output] |
|
) |
|
|
|
iface.launch(auth=("gini", "pick")) |
|
|