# Spaces: Building (page-status text captured together with the source; not part of the program)
import json
import os
from datetime import datetime, timedelta

import gradio as gr
import requests
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6" | |
MAJOR_COUNTRIES = [ | |
"United States", "United Kingdom", "Canada", "Australia", "Germany", | |
"France", "Japan", "South Korea", "China", "India", | |
"Brazil", "Mexico", "Russia", "Italy", "Spain", | |
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", | |
"Finland", "Belgium", "Austria", "New Zealand", "Ireland", | |
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", | |
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", | |
"Hungary", "Greece", "Portugal", "Argentina", "Chile", | |
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", | |
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh" | |
] | |
def search_serphouse(query, country, page, num_result): | |
url = "https://api.serphouse.com/serp/live" | |
payload = { | |
"data": { | |
"q": query, | |
"domain": "google.com", | |
"loc": country, | |
"lang": "en", | |
"device": "desktop", | |
"serp_type": "news", | |
"page": str(page), | |
"verbatim": "1", | |
"num": str(num_result) | |
} | |
} | |
headers = { | |
"accept": "application/json", | |
"content-type": "application/json", | |
"authorization": f"Bearer {API_KEY}" | |
} | |
try: | |
response = requests.post(url, json=payload, headers=headers) | |
response.raise_for_status() | |
return response.json() | |
except requests.RequestException as e: | |
return f"Error: {str(e)}" | |
def is_recent_news(time_str): | |
if not time_str: | |
return False | |
time_parts = time_str.lower().split() | |
if len(time_parts) < 2: | |
return False | |
try: | |
value = int(time_parts[0]) | |
unit = time_parts[1] | |
if unit in ['minute', 'minutes', 'hour', 'hours']: | |
return True | |
elif unit in ['day', 'days']: | |
return value <= 1 | |
except ValueError: | |
return False | |
return False | |
def format_results(results): | |
all_results = "## All News Results\n\n" | |
recent_results = "## Recent News Results (Within 1 Day)\n\n" | |
debug_info = "## Debug Information\n\n" | |
debug_info += f"Raw API Response:\n```json\n{json.dumps(results, indent=2)}\n```\n\n" | |
try: | |
if not isinstance(results, dict): | |
raise ValueError("Results is not a dictionary") | |
if "results" not in results: | |
raise ValueError("No 'results' key in the response") | |
if "news" not in results["results"]: | |
raise ValueError("No 'news' key in results") | |
news_results = results["results"]["news"] | |
debug_info += f"Number of news results: {len(news_results)}\n\n" | |
for result in news_results: | |
title = result.get("title", "No Title") | |
url = result.get("url", "#") | |
snippet = result.get("snippet", "No Snippet") | |
channel = result.get("channel", "Unknown") | |
time_str = result.get("time", "Unknown time") | |
is_recent = is_recent_news(time_str) | |
debug_info += f"Article: {title}\nTime: {time_str}, Is Recent: {is_recent}\n\n" | |
article_info = f""" | |
### [{title}]({url}) | |
{snippet} | |
**Source:** {channel} - {time_str} | |
--- | |
""" | |
all_results += article_info | |
if is_recent: | |
recent_results += article_info | |
if recent_results == "## Recent News Results (Within 1 Day)\n\n": | |
recent_results += "*No recent news results found within 1 day.*\n\n" | |
except Exception as e: | |
error_message = f"Error processing results: {str(e)}" | |
debug_info += error_message + "\n" | |
all_results = error_message + "\n\n" | |
recent_results = error_message + "\n\n" | |
return all_results, recent_results, debug_info | |
def serphouse_search(query, country, page, num_result): | |
results = search_serphouse(query, country, page, num_result) | |
all_results, recent_results, debug_info = format_results(results) | |
return all_results, recent_results, debug_info | |
css = """ | |
footer { | |
visibility: hidden; | |
} | |
""" | |
iface = gr.Interface( | |
fn=serphouse_search, | |
inputs=[ | |
gr.Textbox(label="Search Query"), | |
gr.Dropdown(MAJOR_COUNTRIES, label="Country"), | |
gr.Slider(1, 10, 1, label="Page"), | |
gr.Slider(1, 100, 10, label="Number of Results") | |
], | |
outputs=[ | |
gr.Markdown(label="All Results"), | |
gr.Markdown(label="Recent Results (Within 1 Day)"), | |
gr.Markdown(label="Debug Information") | |
], | |
title="SERPHouse News Search Interface", | |
description="Enter your search query and select a country to get news results from the SERPHouse API. Recent results (within 1 day) are shown separately.", | |
theme="Nymbo/Nymbo_Theme", | |
css=css | |
) | |
iface.launch() | |