Spaces:
Running
Running
File size: 5,795 Bytes
12d3fa4 f2842d4 1ee305b f2842d4 0d52d72 f2842d4 e420980 f2842d4 eb43e13 f4723df eb43e13 f2842d4 1ee305b f4723df f2842d4 eb43e13 f2842d4 eb43e13 f2842d4 4e396cb f2842d4 606cff4 f2842d4 12d3fa4 eb43e13 57624e4 fbd003b 57624e4 f2842d4 46b3475 f7bc11a eb43e13 f7bc11a 46b3475 f7bc11a fbd003b 46b3475 e420980 f7bc11a e420980 eb43e13 4172426 12d3fa4 eb43e13 4172426 e420980 4172426 e420980 eb43e13 4172426 e420980 46b3475 fbd003b 46b3475 f2842d4 fbd003b f2842d4 fbd003b c56613a f2842d4 12d3fa4 f2842d4 46b3475 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 |
import gradio as gr
import requests
import json
from datetime import datetime, timedelta
API_KEY = "V38CNn4HXpLtynJQyOeoUensTEYoFy8PBUxKpDqAW1pawT1vfJ2BWtPQ98h6"
MAJOR_COUNTRIES = [
"United States", "United Kingdom", "Canada", "Australia", "Germany",
"France", "Japan", "South Korea", "China", "India",
"Brazil", "Mexico", "Russia", "Italy", "Spain",
"Netherlands", "Sweden", "Switzerland", "Norway", "Denmark",
"Finland", "Belgium", "Austria", "New Zealand", "Ireland",
"Singapore", "Hong Kong", "Israel", "United Arab Emirates", "Saudi Arabia",
"South Africa", "Turkey", "Egypt", "Poland", "Czech Republic",
"Hungary", "Greece", "Portugal", "Argentina", "Chile",
"Colombia", "Peru", "Venezuela", "Thailand", "Malaysia",
"Indonesia", "Philippines", "Vietnam", "Pakistan", "Bangladesh"
]
def search_serphouse(query, country, page, num_result):
url = "https://api.serphouse.com/serp/live"
now = datetime.utcnow()
yesterday = now - timedelta(days=1)
date_range = f"{yesterday.strftime('%Y-%m-%d')},{now.strftime('%Y-%m-%d')}"
payload = {
"data": {
"q": query,
"domain": "google.com",
"loc": country,
"lang": "en",
"device": "desktop",
"serp_type": "news",
"page": str(page),
"verbatim": "1",
"num": str(num_result),
"date_range": date_range
}
}
headers = {
"accept": "application/json",
"content-type": "application/json",
"authorization": f"Bearer {API_KEY}"
}
try:
response = requests.post(url, json=payload, headers=headers)
response.raise_for_status()
return response.json()
except requests.RequestException as e:
error_msg = f"Error: {str(e)}"
if response.text:
error_msg += f"\nResponse content: {response.text}"
return {"error": error_msg}
def format_results_from_raw(results):
try:
debug_info = f"Raw API Response:\n{json.dumps(results, indent=2, ensure_ascii=False)}"
if isinstance(results, dict) and "error" in results:
return "Error: " + results["error"], debug_info
if not isinstance(results, dict):
raise ValueError("๊ฒฐ๊ณผ๊ฐ ์ฌ์ ํ์์ด ์๋๋๋ค.")
# 'results' ํค ๋ด๋ถ์ ๊ตฌ์กฐ ํ์ธ
if 'results' in results:
results_content = results['results']
# 'news' ํค ํ์ธ
if 'news' in results_content:
news_results = results_content['news']
else:
news_results = []
else:
news_results = []
if not news_results:
return "๊ฒ์ ๊ฒฐ๊ณผ๊ฐ ์์ต๋๋ค.", debug_info
formatted_articles = ""
for result in news_results:
title = result.get("title", "์ ๋ชฉ ์์")
link = result.get("url", result.get("link", "#"))
snippet = result.get("snippet", "๋ด์ฉ ์์")
channel = result.get("channel", result.get("source", "์ ์ ์์"))
time = result.get("time", result.get("date", "์ ์ ์๋ ์๊ฐ"))
image_url = result.get("img", result.get("thumbnail", ""))
# base64๋ก ์ธ์ฝ๋ฉ๋ ์ด๋ฏธ์ง๋ฅผ ์ฒ๋ฆฌํ์ง ์์
if image_url and not image_url.startswith("data:image"):
image_html = f'<img src="{image_url}" alt="Image" style="max-width: 100%; height: auto;">'
else:
image_html = ''
article_html = f"""
<div style="margin-bottom: 20px; border-bottom: 1px solid #ccc; padding-bottom: 20px;">
<h3><a href="{link}" target="_blank">{title}</a></h3>
<p><strong>{channel}</strong> - {time}</p>
{image_html}
<p>{snippet}</p>
</div>
"""
formatted_articles += article_html
return formatted_articles, debug_info
except Exception as e:
error_message = f"๊ฒฐ๊ณผ ์ฒ๋ฆฌ ์ค ์ค๋ฅ ๋ฐ์: {str(e)}"
debug_info = f"Error: {error_message}\n"
return "Error: " + error_message, debug_info
def serphouse_search(query, country, page, num_result):
results = search_serphouse(query, country, page, num_result)
formatted_articles, debug_info = format_results_from_raw(results)
return formatted_articles, debug_info
css = """
footer {
visibility: hidden;
}
"""
# Gradio ์ธํฐํ์ด์ค ๊ตฌ์ฑ
with gr.Blocks(css=css, title="24์๊ฐ ์ด๋ด ๋ด์ค ๊ฒ์ ์ธํฐํ์ด์ค") as iface:
gr.Markdown("## 24์๊ฐ ์ด๋ด ๋ด์ค ๊ฒ์ ์ธํฐํ์ด์ค")
gr.Markdown("๊ฒ์์ด๋ฅผ ์
๋ ฅํ๊ณ ๊ตญ๊ฐ๋ฅผ ์ ํํ์ฌ 24์๊ฐ ์ด๋ด์ ๋ด์ค ๊ฒฐ๊ณผ๋ฅผ ๊ฐ์ ธ์ต๋๋ค.")
with gr.Tab("๊ฒ์"):
with gr.Row():
query = gr.Textbox(label="๊ฒ์์ด")
country = gr.Dropdown(MAJOR_COUNTRIES, label="๊ตญ๊ฐ", value="South Korea")
with gr.Row():
page = gr.Slider(1, 10, 1, label="ํ์ด์ง")
num_result = gr.Slider(1, 100, 10, label="๊ฒฐ๊ณผ ์")
search_button = gr.Button("๊ฒ์")
with gr.Tab("๋ด์ค ๊ฒฐ๊ณผ"):
news_output = gr.HTML(label="๋ด์ค ๊ฒฐ๊ณผ")
with gr.Tab("๋๋ฒ๊ทธ ์ ๋ณด"):
debug_output = gr.Textbox(label="๋๋ฒ๊ทธ ์ ๋ณด", lines=10)
def search_and_display(query, country, page, num_result):
articles, debug_info = serphouse_search(query, country, page, num_result)
return {news_output: articles, debug_output: debug_info}
search_button.click(
search_and_display,
inputs=[query, country, page, num_result],
outputs=[news_output, debug_output]
)
iface.launch(auth=("gini", "pick"))
|