Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
import gradio as gr | |
import requests | |
import json | |
from datetime import datetime, timedelta | |
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6" | |
MAJOR_COUNTRIES = [ | |
"United States", "United Kingdom", "Canada", "Australia", "Germany", | |
"France", "Japan", "South Korea", "China", "India", | |
"Brazil", "Mexico", "Russia", "Italy", "Spain", | |
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark", | |
"Finland", "Belgium", "Austria", "New Zealand", "Ireland", | |
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia", | |
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic", | |
"Hungary", "Greece", "Portugal", "Argentina", "Chile", | |
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia", | |
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh" | |
] | |
def search_serphouse(query, country, page=1, num_result=100): | |
url = "https://api.serphouse.com/serp/live" | |
now = datetime.utcnow() | |
yesterday = now - timedelta(days=1) | |
date_range = f"{yesterday.strftime('%Y-%m-%d')},{now.strftime('%Y-%m-%d')}" | |
payload = { | |
"data": { | |
"q": query, | |
"domain": "google.com", | |
"loc": country, | |
"lang": "en", | |
"device": "desktop", | |
"serp_type": "news", | |
"page": str(page), | |
"verbatim": "1", | |
"num": str(num_result), | |
"date_range": date_range | |
} | |
} | |
headers = { | |
"accept": "application/json", | |
"content-type": "application/json", | |
"authorization": f"Bearer {API_KEY}" | |
} | |
try: | |
response = requests.post(url, json=payload, headers=headers) | |
response.raise_for_status() | |
return response.json() | |
except requests.RequestException as e: | |
error_msg = f"Error: {str(e)}" | |
if response.text: | |
error_msg += f"\nResponse content: {response.text}" | |
return {"error": error_msg} | |
def format_results_from_raw(results): | |
try: | |
# ๋๋ฒ๊ทธ ์ ๋ณด ์๋ต | |
debug_info = "" | |
if isinstance(results, dict) and "error" in results: | |
return "Error: " + results["error"], "" | |
if not isinstance(results, dict): | |
raise ValueError("๊ฒฐ๊ณผ๊ฐ ์ฌ์ ํ์์ด ์๋๋๋ค.") | |
# 'results' ํค ๋ด๋ถ์ ๊ตฌ์กฐ ํ์ธ (์ค์ฒฉ๋ 'results' ์ฒ๋ฆฌ) | |
if 'results' in results: | |
results_content = results['results'] | |
if 'results' in results_content: | |
results_content = results_content['results'] | |
# 'news' ํค ํ์ธ | |
if 'news' in results_content: | |
news_results = results_content['news'] | |
else: | |
news_results = [] | |
else: | |
news_results = [] | |
else: | |
news_results = [] | |
if not news_results: | |
return "๊ฒ์ ๊ฒฐ๊ณผ๊ฐ ์์ต๋๋ค.", "" | |
# ๋ด์ค ๊ฒฐ๊ณผ๋ฅผ ๋ฆฌ์คํธ ํํ๋ก ํฌ๋งทํ (์ด๋ฏธ์ง ์ธ๋ค์ผ ํฌํจ) | |
list_output = "" | |
for idx, result in enumerate(news_results, 1): | |
title = result.get("title", "์ ๋ชฉ ์์") | |
link = result.get("url", result.get("link", "#")) | |
snippet = result.get("snippet", "๋ด์ฉ ์์") | |
channel = result.get("channel", result.get("source", "์ ์ ์์")) | |
time = result.get("time", result.get("date", "์ ์ ์๋ ์๊ฐ")) | |
image_url = result.get("img", result.get("thumbnail", "")) | |
# base64๋ก ์ธ์ฝ๋ฉ๋ ์ด๋ฏธ์ง๋ฅผ ์ฒ๋ฆฌํ์ง ์์ | |
if image_url and not image_url.startswith("data:image"): | |
thumbnail_html = f'<img src="{image_url}" alt="Thumbnail" style="width: 100px; height: auto;">' | |
else: | |
thumbnail_html = '' | |
# ๋ฆฌ์คํธ ํ์์ ๊ธฐ์ฌ (์ด๋ฏธ์ง ์ธ๋ค์ผ ํฌํจ) | |
list_item = f""" | |
<div style="margin-bottom: 20px;"> | |
<h4>{idx}. <a href="{link}" target="_blank">{title}</a></h4> | |
<p>{thumbnail_html}</p> | |
<p>์์ฝ: {snippet}</p> | |
<p>์ถ์ฒ: {channel} | ์๊ฐ: {time}</p> | |
<hr> | |
</div> | |
""" | |
list_output += list_item | |
return list_output, "" | |
except Exception as e: | |
error_message = f"๊ฒฐ๊ณผ ์ฒ๋ฆฌ ์ค ์ค๋ฅ ๋ฐ์: {str(e)}" | |
return "Error: " + error_message, "" | |
def serphouse_search(query, country): | |
# ํ์ด์ง์ ๊ฒฐ๊ณผ ์์ ๊ธฐ๋ณธ๊ฐ์ ์ค์ ํฉ๋๋ค. | |
page = 1 | |
num_result = 100 | |
results = search_serphouse(query, country, page, num_result) | |
list_output, debug_info = format_results_from_raw(results) | |
return list_output | |
css = """ | |
footer { | |
visibility: hidden; | |
} | |
/* '๋ด์ค ๊ฒฐ๊ณผ'์ '๋๋ฒ๊ทธ ์ ๋ณด' ํญ ์จ๊ธฐ๊ธฐ */ | |
#tab-๋ด์ค_๊ฒฐ๊ณผ, #tab-๋๋ฒ๊ทธ_์ ๋ณด { | |
display: none !important; | |
} | |
/* 'ํ์ด์ง'์ '๊ฒฐ๊ณผ ์' ์ ๋ ฅ ์์ ์จ๊ธฐ๊ธฐ */ | |
.slider-container { | |
display: none !important; | |
} | |
""" | |
# Gradio ์ธํฐํ์ด์ค ๊ตฌ์ฑ | |
with gr.Blocks(theme="Nymbo/Nymbo_Theme", css=css, title="NewsAI ์๋น์ค") as iface: | |
gr.Markdown("๊ฒ์์ด๋ฅผ ์ ๋ ฅํ๊ณ ์ํ๋ ๊ตญ๊ฐ๋ฅผ ์ ํํ๋ฉด, ๊ฒ์์ด์ ์ผ์นํ๋ 24์๊ฐ ์ด๋ด ๋ด์ค๋ฅผ ์ต๋ 100๊ฐ ์ถ๋ ฅํฉ๋๋ค.") | |
with gr.Tab("๊ฒ์"): | |
with gr.Row(): | |
query = gr.Textbox(label="๊ฒ์์ด") | |
country = gr.Dropdown(MAJOR_COUNTRIES, label="๊ตญ๊ฐ", value="South Korea") | |
# 'ํ์ด์ง'์ '๊ฒฐ๊ณผ ์' ์ ๋ ฅ ์์ ์ ๊ฑฐ | |
# with gr.Row(): | |
# page = gr.Slider(1, 10, 1, label="ํ์ด์ง") | |
# num_result = gr.Slider(1, 100, 100, label="๊ฒฐ๊ณผ ์") | |
search_button = gr.Button("๊ฒ์") | |
# '๋ด์ค ๊ฒฐ๊ณผ'์ '๋๋ฒ๊ทธ ์ ๋ณด' ํญ ์ ๊ฑฐ | |
# with gr.Tab("๋ด์ค ๊ฒฐ๊ณผ"): | |
# news_output = gr.HTML(label="๋ด์ค ๊ฒฐ๊ณผ") | |
with gr.Tab("๋ฆฌ์คํธ"): | |
list_output = gr.HTML(label="๋ฆฌ์คํธ ๊ฒฐ๊ณผ") # HTML๋ก ๋ณ๊ฒฝ | |
# with gr.Tab("๋๋ฒ๊ทธ ์ ๋ณด"): | |
# debug_output = gr.Textbox(label="๋๋ฒ๊ทธ ์ ๋ณด", lines=10) | |
def search_and_display(query, country): | |
list_output_text = serphouse_search(query, country) | |
return {list_output: list_output_text} | |
search_button.click( | |
search_and_display, | |
inputs=[query, country], | |
outputs=[list_output] | |
) | |
iface.launch(auth=("gini", "pick")) | |