File size: 4,430 Bytes
09ebcd0
 
eec4d01
efb5f18
09ebcd0
6097fb2
1b298f9
34db24b
 
 
 
 
 
 
 
 
 
 
6097fb2
1b298f9
eec4d01
6097fb2
2efa0ec
eec4d01
 
 
 
 
 
 
 
 
 
 
 
1b298f9
6097fb2
 
eec4d01
 
 
6097fb2
 
eec4d01
6097fb2
 
 
 
 
1b298f9
482bc99
 
 
 
 
 
 
 
 
 
 
 
 
 
6097fb2
482bc99
 
 
 
 
 
 
 
 
 
 
a4f4206
efb5f18
 
482bc99
 
 
 
 
 
 
 
 
 
 
 
 
6097fb2
a4f4206
efb5f18
482bc99
efb5f18
158b524
eec4d01
34db24b
 
eec4d01
6097fb2
68a8b0c
a4f4206
6097fb2
ab30506
6097fb2
34db24b
6097fb2
 
 
ad0f104
efb5f18
a4f4206
 
ad0f104
 
94b1606
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
import gradio as gr
import requests
import json
from datetime import datetime, timedelta

API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6"

MAJOR_COUNTRIES = [
    "United States", "United Kingdom", "Canada", "Australia", "Germany", 
    "France", "Japan", "South Korea", "China", "India", 
    "Brazil", "Mexico", "Russia", "Italy", "Spain", 
    "Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", 
    "Finland", "Belgium", "Austria", "New Zealand", "Ireland", 
    "Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", 
    "South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", 
    "Hungary", "Greece", "Portugal", "Argentina", "Chile", 
    "Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", 
    "Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh"
]

def search_serphouse(query, country, verbatim, page, num_result):
    url = "https://api.serphouse.com/serp/live"
    
    payload = {
        "data": {
            "q": query,
            "domain": "google.com",
            "loc": country,
            "lang": "en",
            "device": "desktop",
            "serp_type": "news",
            "page": str(page),
            "verbatim": verbatim,
            "num": str(num_result)
        }
    }
    
    headers = {
        "accept": "application/json",
        "content-type": "application/json",
        "authorization": f"Bearer {API_KEY}"
    }
    
    response = requests.post(url, json=payload, headers=headers)
    
    if response.status_code == 200:
        return response.json()
    else:
        return f"Error: {response.status_code} - {response.text}"

def is_within_24_hours(time_str):
    time_parts = time_str.split()
    if len(time_parts) >= 2:
        try:
            value = int(time_parts[0])
            unit = time_parts[1].lower()
            if unit in ['minute', 'minutes', 'hour', 'hours']:
                return True
            elif unit in ['day', 'days'] and value == 1:
                return True
        except ValueError:
            pass
    return False

def format_results(results):
    html_output = """
    <style>
        .news-container { font-family: Arial, sans-serif; max-width: 800px; margin: 0 auto; }
        .news-item { border: 1px solid #ddd; padding: 15px; margin-bottom: 20px; border-radius: 5px; }
        .news-title { font-size: 18px; color: #1a0dab; text-decoration: none; }
        .news-snippet { color: #545454; margin: 10px 0; }
        .news-meta { font-size: 12px; color: #006621; }
    </style>
    <div class="news-container">
        <h2>Search Results (Last 24 Hours)</h2>
    """
    
    if isinstance(results, dict) and "results" in results:
        news_results = results["results"].get("news", [])
        filtered_results = [result for result in news_results if is_within_24_hours(result.get("time", "").strip())]
        
        if not filtered_results:
            html_output += "<p>No news results found within the last 24 hours.</p>"
        else:
            for result in filtered_results:
                html_output += f"""
                <div class="news-item">
                    <a href="{result.get('url', '#')}" class="news-title">{result.get('title', 'No Title')}</a>
                    <p class="news-snippet">{result.get('snippet', 'No Snippet')}</p>
                    <p class="news-meta">Source: {result.get('channel', 'Unknown')} - {result.get('time', 'Unknown time')}</p>
                </div>
                """
    else:
        html_output += "<p>Unexpected response format or no results found.</p>"
    
    html_output += "</div>"
    return html_output

def serphouse_search(query, country, verbatim, page, num_result):
    verbatim = "1" if verbatim else "0"
    
    results = search_serphouse(query, country, verbatim, page, num_result)
    return format_results(results)

iface = gr.Interface(
    fn=serphouse_search,
    inputs=[
        gr.Textbox(label="Search Query"),
        gr.Dropdown(MAJOR_COUNTRIES, label="Country"),
        gr.Checkbox(label="Verbatim"),
        gr.Slider(1, 10, 1, label="Page"),
        gr.Slider(1, 100, 10, label="Number of Results")
    ],
    outputs="html",
    title="SERPHouse News Search Interface",
    description="Enter your search query and select a country to get news results from the SERPHouse API. Only articles from the last 24 hours will be displayed."
)

iface.launch()