Spaces:
Running
Running
File size: 5,695 Bytes
09ebcd0 eec4d01 efb5f18 09ebcd0 6097fb2 1b298f9 34db24b 6097fb2 1b298f9 8415ea5 6097fb2 2efa0ec eec4d01 8415ea5 eec4d01 1b298f9 6097fb2 eec4d01 6097fb2 ba53ac8 6097fb2 ba53ac8 1b298f9 a31c3ed 73ed8f5 8415ea5 73ed8f5 8415ea5 73ed8f5 8415ea5 73ed8f5 8415ea5 73ed8f5 8415ea5 73ed8f5 8415ea5 73ed8f5 482bc99 6097fb2 d0b4b99 ae814df a4f4206 73ed8f5 ba53ac8 8415ea5 73ed8f5 ba53ac8 d0b4b99 ae814df 73ed8f5 ae814df d0b4b99 c5cb552 ae814df c5cb552 ae814df d0b4b99 ae814df d0b4b99 482bc99 d0b4b99 73ed8f5 ba53ac8 d0b4b99 73ed8f5 efb5f18 ae814df 158b524 8415ea5 ae814df 73ed8f5 68a8b0c 43da967 ba53ac8 6097fb2 ab30506 6097fb2 43da967 ad0f104 d0b4b99 73ed8f5 ae814df d0b4b99 43da967 d0b4b99 43da967 ad0f104 43da967 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 |
import gradio as gr
import requests
import json
from datetime import datetime, timedelta
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6"
MAJOR_COUNTRIES = [
"United States", "United Kingdom", "Canada", "Australia", "Germany",
"France", "Japan", "South Korea", "China", "India",
"Brazil", "Mexico", "Russia", "Italy", "Spain",
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark",
"Finland", "Belgium", "Austria", "New Zealand", "Ireland",
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia",
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic",
"Hungary", "Greece", "Portugal", "Argentina", "Chile",
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia",
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh"
]
def search_serphouse(query, country, page, num_result):
url = "https://api.serphouse.com/serp/live"
payload = {
"data": {
"q": query,
"domain": "google.com",
"loc": country,
"lang": "en",
"device": "desktop",
"serp_type": "news",
"page": str(page),
"verbatim": "1",
"num": str(num_result)
}
}
headers = {
"accept": "application/json",
"content-type": "application/json",
"authorization": f"Bearer {API_KEY}"
}
try:
response = requests.post(url, json=payload, headers=headers)
response.raise_for_status()
return response.json()
except requests.RequestException as e:
return f"Error: {str(e)}"
def is_recent_news(time_str):
debug_info = f"Checking time: {time_str}\n"
if not time_str:
debug_info += "Time string is empty\n"
return False, debug_info
time_parts = time_str.lower().split()
debug_info += f"Time parts: {time_parts}\n"
if len(time_parts) < 2:
debug_info += "Time parts less than 2\n"
return False, debug_info
try:
value = int(time_parts[0])
unit = time_parts[1]
debug_info += f"Value: {value}, Unit: {unit}\n"
if unit in ['minute', 'minutes', 'hour', 'hours']:
debug_info += "Within minutes or hours\n"
return True, debug_info
elif unit in ['day', 'days']:
is_recent = value <= 1
debug_info += f"Within days, is recent: {is_recent}\n"
return is_recent, debug_info
else:
debug_info += f"Unknown unit: {unit}\n"
return False, debug_info
except ValueError:
debug_info += f"ValueError when parsing: {time_parts[0]}\n"
return False, debug_info
def format_results(results):
all_results = "## All News Results\n\n"
recent_results = "## Recent News Results (Within 1 Day)\n\n"
debug_info = "## Debug Information\n\n"
debug_info += f"Raw API Response:\n```json\n{json.dumps(results, indent=2)}\n```\n\n"
try:
if isinstance(results, dict) and "results" in results and "news" in results["results"]:
news_results = results["results"]["news"]
debug_info += f"Number of news results: {len(news_results)}\n\n"
for result in news_results:
time_str = result.get("time", "Unknown time")
is_recent, time_debug = is_recent_news(time_str)
debug_info += f"Article: {result.get('title', 'No Title')}\n{time_debug}\n"
all_results += f"""
### [{result.get('title', 'No Title')}]({result.get('url', '#')})
{result.get('snippet', 'No Snippet')}
**Source:** {result.get('channel', 'Unknown')} - {time_str}
---
"""
if is_recent:
recent_results += f"""
### [{result.get('title', 'No Title')}]({result.get('url', '#')})
{result.get('snippet', 'No Snippet')}
**Source:** {result.get('channel', 'Unknown')} - {time_str}
---
"""
if recent_results == "## Recent News Results (Within 1 Day)\n\n":
recent_results += "*No recent news results found within 1 day.*\n\n"
else:
all_results += "*No valid news results found in the API response.*\n\n"
recent_results += "*No valid news results found in the API response.*\n\n"
debug_info += "Invalid or unexpected API response structure\n"
except Exception as e:
all_results += f"*Error processing results: {str(e)}*\n\n"
recent_results += f"*Error processing results: {str(e)}*\n\n"
debug_info += f"Exception occurred: {str(e)}\n"
return all_results, recent_results, debug_info
def serphouse_search(query, country, page, num_result):
results = search_serphouse(query, country, page, num_result)
all_results, recent_results, debug_info = format_results(results)
return all_results, recent_results, debug_info
css = """
footer {
visibility: hidden;
}
"""
iface = gr.Interface(
fn=serphouse_search,
inputs=[
gr.Textbox(label="Search Query"),
gr.Dropdown(MAJOR_COUNTRIES, label="Country"),
gr.Slider(1, 10, 1, label="Page"),
gr.Slider(1, 100, 10, label="Number of Results")
],
outputs=[
gr.Markdown(label="All Results"),
gr.Markdown(label="Recent Results (Within 1 Day)"),
gr.Markdown(label="Debug Information")
],
title="SERPHouse News Search Interface",
description="Enter your search query and select a country to get news results from the SERPHouse API. Recent results (within 1 day) are shown separately.",
theme="Nymbo/Nymbo_Theme",
css=css
)
iface.launch() |