File size: 4,839 Bytes
09ebcd0
 
eec4d01
efb5f18
09ebcd0
6097fb2
1b298f9
34db24b
 
 
 
 
 
 
 
 
 
 
6097fb2
1b298f9
eec4d01
6097fb2
2efa0ec
eec4d01
 
 
 
 
 
 
 
 
 
 
 
1b298f9
6097fb2
 
eec4d01
 
 
6097fb2
 
eec4d01
6097fb2
 
 
 
 
1b298f9
482bc99
 
 
 
 
 
 
 
2001e6e
482bc99
 
 
 
 
6097fb2
482bc99
 
 
2001e6e
 
 
 
 
 
482bc99
 
2001e6e
482bc99
a4f4206
2001e6e
 
 
 
 
 
482bc99
2001e6e
 
 
 
 
 
 
 
 
 
efb5f18
482bc99
efb5f18
158b524
eec4d01
34db24b
 
eec4d01
6097fb2
68a8b0c
2001e6e
 
 
 
 
 
 
 
6097fb2
ab30506
6097fb2
34db24b
6097fb2
 
 
ad0f104
efb5f18
a4f4206
 
ad0f104
 
94b1606
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
import gradio as gr
import requests
import json
from datetime import datetime, timedelta

API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6"

MAJOR_COUNTRIES = [
    "United States", "United Kingdom", "Canada", "Australia", "Germany", 
    "France", "Japan", "South Korea", "China", "India", 
    "Brazil", "Mexico", "Russia", "Italy", "Spain", 
    "Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", 
    "Finland", "Belgium", "Austria", "New Zealand", "Ireland", 
    "Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", 
    "South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", 
    "Hungary", "Greece", "Portugal", "Argentina", "Chile", 
    "Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", 
    "Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh"
]

def search_serphouse(query, country, verbatim, page, num_result):
    url = "https://api.serphouse.com/serp/live"
    
    payload = {
        "data": {
            "q": query,
            "domain": "google.com",
            "loc": country,
            "lang": "en",
            "device": "desktop",
            "serp_type": "news",
            "page": str(page),
            "verbatim": verbatim,
            "num": str(num_result)
        }
    }
    
    headers = {
        "accept": "application/json",
        "content-type": "application/json",
        "authorization": f"Bearer {API_KEY}"
    }
    
    response = requests.post(url, json=payload, headers=headers)
    
    if response.status_code == 200:
        return response.json()
    else:
        return f"Error: {response.status_code} - {response.text}"

def is_within_24_hours(time_str):
    time_parts = time_str.split()
    if len(time_parts) >= 2:
        try:
            value = int(time_parts[0])
            unit = time_parts[1].lower()
            if unit in ['minute', 'minutes', 'hour', 'hours']:
                return True
            elif unit == 'day' and value == 1:
                return True
        except ValueError:
            pass
    return False

def format_results(results):
    html_output = """
    <style>
        .news-container { font-family: Arial, sans-serif; max-width: 800px; margin: 0 auto; }
        .news-item { background-color: #f9f9f9; border: 1px solid #ddd; padding: 20px; margin-bottom: 20px; border-radius: 8px; box-shadow: 0 2px 4px rgba(0,0,0,0.1); }
        .news-title { font-size: 20px; color: #1a0dab; text-decoration: none; font-weight: bold; }
        .news-title:hover { text-decoration: underline; }
        .news-snippet { color: #545454; margin: 15px 0; line-height: 1.4; }
        .news-meta { font-size: 14px; color: #006621; }
        .no-results { text-align: center; color: #666; font-style: italic; }
    </style>
    <div class="news-container">
        <h2 style="text-align: center; color: #333;">Search Results (Last 24 Hours)</h2>
    """
    
    if isinstance(results, dict) and "results" in results:
        news_results = results["results"].get("news", [])
        filtered_results = [result for result in news_results if is_within_24_hours(result.get("time", "").strip())]
        
        if not filtered_results:
            html_output += '<p class="no-results">No news results found within the last 24 hours.</p>'
        else:
            for result in filtered_results:
                html_output += f"""
                <div class="news-item">
                    <a href="{result.get('url', '#')}" class="news-title" target="_blank">{result.get('title', 'No Title')}</a>
                    <p class="news-snippet">{result.get('snippet', 'No Snippet')}</p>
                    <p class="news-meta">Source: {result.get('channel', 'Unknown')} - {result.get('time', 'Unknown time')}</p>
                </div>
                """
    else:
        html_output += '<p class="no-results">No results found or unexpected response format.</p>'
    
    html_output += "</div>"
    return html_output

def serphouse_search(query, country, verbatim, page, num_result):
    verbatim = "1" if verbatim else "0"
    
    results = search_serphouse(query, country, verbatim, page, num_result)
    return format_results(results)

css = """
footer {
    visibility: hidden;
}
"""


iface = gr.Interface(theme="Nymbo/Nymbo_Theme", css=css,
    fn=serphouse_search,
    inputs=[
        gr.Textbox(label="Search Query"),
        gr.Dropdown(MAJOR_COUNTRIES, label="Country"),
        gr.Checkbox(label="Verbatim"),
        gr.Slider(1, 10, 1, label="Page"),
        gr.Slider(1, 100, 10, label="Number of Results")
    ],
    outputs="html",
    title="SERPHouse News Search Interface",
    description="Enter your search query and select a country to get news results from the SERPHouse API. Only articles from the last 24 hours will be displayed."
)

iface.launch()