|
|
|
import gradio as gr |
|
import requests |
|
import json |
|
from datetime import datetime, timedelta |
|
|
|
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6" |
|
|
|
MAJOR_COUNTRIES = [ |
|
"United States", "United Kingdom", "Canada", "Australia", "Germany", |
|
"France", "Japan", "South Korea", "China", "India", |
|
"Brazil", "Mexico", "Russia", "Italy", "Spain", |
|
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", |
|
"Finland", "Belgium", "Austria", "New Zealand", "Ireland", |
|
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", |
|
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", |
|
"Hungary", "Greece", "Portugal", "Argentina", "Chile", |
|
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", |
|
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh" |
|
] |
|
|
|
def search_serphouse(query, country, page, num_result): |
|
url = "https://api.serphouse.com/serp/live" |
|
|
|
now = datetime.utcnow() |
|
yesterday = now - timedelta(days=1) |
|
date_range = f"{yesterday.strftime('%Y-%m-%d')},{now.strftime('%Y-%m-%d')}" |
|
|
|
payload = { |
|
"data": { |
|
"q": query, |
|
"domain": "google.com", |
|
"loc": country, |
|
"lang": "en", |
|
"device": "desktop", |
|
"serp_type": "news", |
|
"page": str(page), |
|
"verbatim": "1", |
|
"num": str(num_result), |
|
"date_range": date_range |
|
} |
|
} |
|
|
|
headers = { |
|
"accept": "application/json", |
|
"content-type": "application/json", |
|
"authorization": f"Bearer {API_KEY}" |
|
} |
|
|
|
try: |
|
response = requests.post(url, json=payload, headers=headers) |
|
response.raise_for_status() |
|
return response.json() |
|
except requests.RequestException as e: |
|
error_msg = f"Error: {str(e)}" |
|
if response.text: |
|
error_msg += f"\nResponse content: {response.text}" |
|
return {"error": error_msg} |
|
|
|
def format_results_from_raw(results): |
|
try: |
|
debug_info = f"Raw API Response:\n{json.dumps(results, indent=2, ensure_ascii=False)}" |
|
|
|
if isinstance(results, dict) and "error" in results: |
|
return "Error: " + results["error"], debug_info |
|
|
|
if not isinstance(results, dict): |
|
raise ValueError("๊ฒฐ๊ณผ๊ฐ ์ฌ์ ํ์์ด ์๋๋๋ค.") |
|
|
|
|
|
if 'results' in results: |
|
results_content = results['results'] |
|
|
|
if 'news' in results_content: |
|
news_results = results_content['news'] |
|
else: |
|
news_results = [] |
|
else: |
|
news_results = [] |
|
|
|
if not news_results: |
|
return "๊ฒ์ ๊ฒฐ๊ณผ๊ฐ ์์ต๋๋ค.", debug_info |
|
|
|
formatted_articles = "" |
|
for result in news_results: |
|
title = result.get("title", "์ ๋ชฉ ์์") |
|
link = result.get("url", result.get("link", "#")) |
|
snippet = result.get("snippet", "๋ด์ฉ ์์") |
|
channel = result.get("channel", result.get("source", "์ ์ ์์")) |
|
time = result.get("time", result.get("date", "์ ์ ์๋ ์๊ฐ")) |
|
image_url = result.get("img", result.get("thumbnail", "")) |
|
|
|
|
|
if image_url and not image_url.startswith("data:image"): |
|
image_html = f'<img src="{image_url}" alt="Image" style="max-width: 100%; height: auto;">' |
|
else: |
|
image_html = '' |
|
|
|
article_html = f""" |
|
<div style="margin-bottom: 20px; border-bottom: 1px solid #ccc; padding-bottom: 20px;"> |
|
<h3><a href="{link}" target="_blank">{title}</a></h3> |
|
<p><strong>{channel}</strong> - {time}</p> |
|
{image_html} |
|
<p>{snippet}</p> |
|
</div> |
|
""" |
|
formatted_articles += article_html |
|
|
|
return formatted_articles, debug_info |
|
|
|
except Exception as e: |
|
error_message = f"๊ฒฐ๊ณผ ์ฒ๋ฆฌ ์ค ์ค๋ฅ ๋ฐ์: {str(e)}" |
|
debug_info = f"Error: {error_message}\n" |
|
return "Error: " + error_message, debug_info |
|
|
|
def serphouse_search(query, country, page, num_result): |
|
results = search_serphouse(query, country, page, num_result) |
|
formatted_articles, debug_info = format_results_from_raw(results) |
|
return formatted_articles, debug_info |
|
|
|
css = """ |
|
footer { |
|
visibility: hidden; |
|
} |
|
""" |
|
|
|
|
|
with gr.Blocks(css=css, title="24์๊ฐ ์ด๋ด ๋ด์ค ๊ฒ์ ์ธํฐํ์ด์ค") as iface: |
|
gr.Markdown("## 24์๊ฐ ์ด๋ด ๋ด์ค ๊ฒ์ ์ธํฐํ์ด์ค") |
|
gr.Markdown("๊ฒ์์ด๋ฅผ ์
๋ ฅํ๊ณ ๊ตญ๊ฐ๋ฅผ ์ ํํ์ฌ 24์๊ฐ ์ด๋ด์ ๋ด์ค ๊ฒฐ๊ณผ๋ฅผ ๊ฐ์ ธ์ต๋๋ค.") |
|
|
|
with gr.Tab("๊ฒ์"): |
|
with gr.Row(): |
|
query = gr.Textbox(label="๊ฒ์์ด") |
|
country = gr.Dropdown(MAJOR_COUNTRIES, label="๊ตญ๊ฐ", value="South Korea") |
|
with gr.Row(): |
|
page = gr.Slider(1, 10, 1, label="ํ์ด์ง") |
|
num_result = gr.Slider(1, 100, 10, label="๊ฒฐ๊ณผ ์") |
|
|
|
search_button = gr.Button("๊ฒ์") |
|
|
|
with gr.Tab("๋ด์ค ๊ฒฐ๊ณผ"): |
|
news_output = gr.HTML(label="๋ด์ค ๊ฒฐ๊ณผ") |
|
|
|
with gr.Tab("๋๋ฒ๊ทธ ์ ๋ณด"): |
|
debug_output = gr.Textbox(label="๋๋ฒ๊ทธ ์ ๋ณด", lines=10) |
|
|
|
def search_and_display(query, country, page, num_result): |
|
articles, debug_info = serphouse_search(query, country, page, num_result) |
|
return {news_output: articles, debug_output: debug_info} |
|
|
|
search_button.click( |
|
search_and_display, |
|
inputs=[query, country, page, num_result], |
|
outputs=[news_output, debug_output] |
|
) |
|
|
|
iface.launch(auth=("gini", "pick")) |
|
|