MoneyRadar

Building

App Files Files Community

MoneyRadar / app.py

seawolf2357

Update app.py

8aede25 verified 5 months ago

raw

history blame

8.36 kB

	import gradio as gr
	import requests
	import json
	import os
	from datetime import datetime, timedelta
	from bs4 import BeautifulSoup # 웹 페이지에서 텍스트를 추출하기 위해 사용
	from huggingface_hub import InferenceClient # LLM 사용을 위해 필요

	# Install the required packages (uncomment and run if needed):
	# !pip install bs4 huggingface_hub

	# Credentials are read from the environment so they never live in the source.
	# SERPHOUSE_API_KEY: SerpHouse API key; HF_TOKEN: Hugging Face API token.
	API_KEY = os.environ.get("SERPHOUSE_API_KEY")
	HF_TOKEN = os.environ.get("HF_TOKEN")

	# Country names offered in the UI dropdown; the order here is the display order.
	MAJOR_COUNTRIES = [
	    "United States",
	    "United Kingdom",
	    "Canada",
	    "Australia",
	    "Germany",
	    "France",
	    "Japan",
	    "South Korea",
	    "China",
	    "India",
	    "Brazil",
	    "Mexico",
	    "Russia",
	    "Italy",
	    "Spain",
	    "Netherlands",
	    "Sweden",
	    "Switzerland",
	    "Norway",
	    "Denmark",
	    "Finland",
	    "Belgium",
	    "Austria",
	    "New Zealand",
	    "Ireland",
	    "Singapore",
	    "Hong Kong",
	    "Israel",
	    "United Arab Emirates",
	    "Saudi Arabia",
	    "South Africa",
	    "Turkey",
	    "Egypt",
	    "Poland",
	    "Czech Republic",
	    "Hungary",
	    "Greece",
	    "Portugal",
	    "Argentina",
	    "Chile",
	    "Colombia",
	    "Peru",
	    "Venezuela",
	    "Thailand",
	    "Malaysia",
	    "Indonesia",
	    "Philippines",
	    "Vietnam",
	    "Pakistan",
	    "Bangladesh",
	]

	def search_serphouse(query, country, page=1, num_result=100, timeout=30):
	    """Query the SerpHouse live SERP endpoint for news from the last day.

	    Args:
	        query: Search phrase, sent as ``q``.
	        country: Location name, sent as ``loc``.
	        page: Result page number (sent as a string).
	        num_result: Number of results requested (sent as a string).
	        timeout: Seconds to wait for the HTTP request before giving up.

	    Returns:
	        The decoded JSON body on success, otherwise a dict of the form
	        ``{"error": "<message>"}`` describing the request failure.
	    """
	    # Local import: the file header only imports datetime and timedelta.
	    from datetime import timezone

	    url = "https://api.serphouse.com/serp/live"

	    # Date window: yesterday through today, both in UTC.
	    now = datetime.now(timezone.utc)
	    yesterday = now - timedelta(days=1)
	    date_range = f"{yesterday.strftime('%Y-%m-%d')},{now.strftime('%Y-%m-%d')}"

	    payload = {
	        "data": {
	            "q": query,
	            "domain": "google.com",
	            "loc": country,
	            "lang": "en",
	            "device": "desktop",
	            "serp_type": "news",
	            "page": str(page),
	            "verbatim": "1",
	            "num": str(num_result),
	            "date_range": date_range,
	        }
	    }

	    headers = {
	        "accept": "application/json",
	        "content-type": "application/json",
	        "authorization": f"Bearer {API_KEY}",
	    }

	    # Pre-bind so the except branch never touches an unbound name when the
	    # request fails before any response object exists (DNS, refused, timeout).
	    response = None
	    try:
	        response = requests.post(url, json=payload, headers=headers, timeout=timeout)
	        response.raise_for_status()
	        return response.json()
	    except requests.RequestException as e:
	        error_msg = f"Error: {str(e)}"
	        failed = response if response is not None else getattr(e, "response", None)
	        # Compare against None explicitly: a Response object is falsy for
	        # 4xx/5xx statuses, which are exactly the cases reported here.
	        if failed is not None and failed.text:
	            error_msg += f"\nResponse content: {failed.text}"
	        return {"error": error_msg}

	def format_results_from_raw(results):
	    """Convert a raw search response into ``(error_message, articles)``.

	    ``error_message`` is an empty string on success. ``articles`` is a list of
	    dicts with the keys ``index``, ``title``, ``link``, ``snippet``,
	    ``channel``, ``time`` and ``image_url``; it is empty whenever an error or
	    "no results" message is returned. Any exception raised while processing is
	    reported through the message instead of propagating.
	    """
	    try:
	        if not isinstance(results, dict):
	            raise ValueError("결과가 사전 형식이 아닙니다.")
	        if "error" in results:
	            return "Error: " + results["error"], []

	        # Walk results -> results -> news; a missing level means "no news".
	        news_items = []
	        if 'results' in results:
	            outer = results['results']
	            if 'results' in outer:
	                inner = outer['results']
	                if 'news' in inner:
	                    news_items = inner['news']

	        if not news_items:
	            return "검색 결과가 없습니다.", []

	        # Each field falls back to an alternative key, then to a placeholder.
	        collected = [
	            {
	                "index": position,
	                "title": item.get("title", "제목 없음"),
	                "link": item.get("url", item.get("link", "#")),
	                "snippet": item.get("snippet", "내용 없음"),
	                "channel": item.get("channel", item.get("source", "알 수 없음")),
	                "time": item.get("time", item.get("date", "알 수 없는 시간")),
	                "image_url": item.get("img", item.get("thumbnail", "")),
	            }
	            for position, item in enumerate(news_items, 1)
	        ]
	        return "", collected

	    except Exception as exc:
	        return "Error: " + f"결과 처리 중 오류 발생: {str(exc)}", []

	def serphouse_search(query, country):
	    """Search the first page (up to 100 results) and return ``(error_message, articles)``."""
	    # Page and result count are fixed defaults for the UI.
	    raw_response = search_serphouse(query, country, 1, 100)
	    message, found = format_results_from_raw(raw_response)
	    return message, found

	# LLM setup: one shared Hugging Face inference client for the model id below,
	# authenticated with HF_TOKEN.
	hf_client = InferenceClient("CohereForAI/c4ai-command-r-plus-08-2024", token=HF_TOKEN)

	def summarize_article(url, timeout=15, max_chars=8000):
	    """Fetch an article page and ask the LLM for a three-sentence Korean summary.

	    Args:
	        url: Article address; only ``http://`` and ``https://`` URLs are fetched.
	        timeout: Seconds to wait for the page download.
	        max_chars: Upper bound on the article text placed in the prompt, so an
	            arbitrarily long page cannot produce an arbitrarily long request.
	            Pass ``None`` to send the full text.

	    Returns:
	        The generated summary, or a user-facing message when the URL is
	        rejected, no paragraph text is found, or any step raises.
	    """
	    # The URL arrives from a client-side textbox, so reject anything that is
	    # not a plain web address before making a request.
	    if not isinstance(url, str) or not url.strip().lower().startswith(("http://", "https://")):
	        return "유효한 기사 URL이 아닙니다."

	    try:
	        # Extract the text from the web page.
	        response = requests.get(url.strip(), timeout=timeout)
	        response.raise_for_status()
	        soup = BeautifulSoup(response.text, 'html.parser')
	        # Simple extraction: join the text of every <p> element.
	        text = ' '.join(p.get_text() for p in soup.find_all('p'))
	        if not text.strip():
	            return "기사 내용을 가져올 수 없습니다."

	        # Generate the summary.
	        prompt = f"다음 영어 기사를 한국어로 3문장으로 요약하세요:\n{text[:max_chars]}"
	        summary = hf_client.text_generation(prompt, max_new_tokens=500)
	        return summary
	    except Exception as e:
	        # Best-effort UI helper: report the failure as text rather than raising.
	        return f"요약 중 오류 발생: {str(e)}"

	# Custom stylesheet handed to gr.Blocks(css=...): hides the page footer.
	css = """
	footer {
	visibility: hidden;
	}
	"""

	# Build the Gradio interface.
	with gr.Blocks(css=css, title="NewsAI 서비스") as iface:
	gr.Markdown("검색어를 입력하고 원하는 국가를 선택하면, 검색어와 일치하는 24시간 이내 뉴스를 최대 100개 출력합니다.")

	# Search controls: query text, country dropdown (defaults to South Korea)
	# and the button that triggers the search.
	with gr.Column():
	with gr.Row():
	query = gr.Textbox(label="검색어")
	country = gr.Dropdown(MAJOR_COUNTRIES, label="국가", value="South Korea")
	search_button = gr.Button("검색")

	# output_table receives the rendered result table; summary_output starts
	# hidden and is shown once a search succeeds.
	output_table = gr.HTML()
	summary_output = gr.Markdown(visible=False)

	def _render_article_row(article):
	    """Return one HTML ``<tr>`` for *article* with every field escaped."""
	    import html  # local import: `html` is not imported at the top of this file

	    link = str(article['link'])
	    href = html.escape(link, quote=True)
	    # json.dumps produces a quoted JS string literal; escaping that literal
	    # makes it safe inside the double-quoted onclick attribute, so quotes in
	    # the URL can neither break the call nor inject script.
	    js_arg = html.escape(json.dumps(link), quote=True)
	    index = html.escape(str(article['index']))
	    title = html.escape(str(article['title']))
	    channel = html.escape(str(article['channel']))
	    published = html.escape(str(article['time']))
	    return (
	        "<tr>"
	        f"<td>{index}</td>"
	        f'<td><a href="{href}" target="_blank" rel="noopener noreferrer">{title}</a></td>'
	        f"<td>{channel}</td>"
	        f"<td>{published}</td>"
	        f'<td><button onclick="analyzeArticle({js_arg})">분석</button></td>'
	        "</tr>"
	    )

	def search_and_display(query, country):
	    """Run a news search and render it for the UI.

	    Returns a pair ``(html, update)``: the HTML for ``output_table`` and a
	    ``gr.update`` for ``summary_output`` (hidden on error, shown and cleared
	    on success).
	    """
	    import html  # local import: `html` is not imported at the top of this file

	    error_message, articles = serphouse_search(query, country)
	    if error_message:
	        # The message can embed raw response text from the API, so escape it.
	        return f"<p>{html.escape(str(error_message))}</p>", gr.update(visible=False)

	    # Build the article list as an HTML table.
	    header = "<table border='1' style='width:100%; text-align:left;'><tr><th>번호</th><th>제목</th><th>출처</th><th>시간</th><th>분석</th></tr>"
	    table_html = header + "".join(_render_article_row(article) for article in articles) + "</table>"

	    # JavaScript bridge: copies the URL into the hidden textbox and clicks the
	    # hidden analyze button.
	    # NOTE(review): if gr.HTML injects this markup via innerHTML the <script>
	    # element will not execute, and gradioApp() is not defined anywhere in this
	    # file — confirm analyzeArticle is actually reachable from the onclick.
	    js_code = """
	<script>
	function analyzeArticle(url) {
	// Gradio의 handle_function을 사용하여 Python 함수 호출
	gradioApp().querySelector('#article_url_input textarea').value = url;
	gradioApp().querySelector('#analyze_button').click();
	}
	</script>
	"""

	    full_html = table_html + js_code

	    # Show summary_output and reset its content for the new result set.
	    return full_html, gr.update(visible=True, value="")

	def analyze_article(url):
	    """Return the LLM summary for the article at *url* (click handler for the analyze button)."""
	    return summarize_article(url)

	# Hidden bridge components: the analyzeArticle() JavaScript emitted by
	# search_and_display writes the article URL into '#article_url_input' and
	# clicks '#analyze_button'.
	article_url_input = gr.Textbox(visible=False, elem_id="article_url_input")
	analyze_button = gr.Button("분석", visible=False, elem_id="analyze_button")

	# Search button: run the search and refresh both the table and the summary area.
	search_button.click(
	search_and_display,
	inputs=[query, country],
	outputs=[output_table, summary_output]
	)

	# Hidden analyze button: summarize the URL held in the hidden textbox.
	analyze_button.click(
	analyze_article,
	inputs=[article_url_input],
	outputs=[summary_output]
	)

	# Basic-auth login for the app. Credentials can be supplied through the
	# APP_AUTH_USERNAME / APP_AUTH_PASSWORD environment variables.
	# NOTE(review): the fallbacks keep the previously hard-coded values so existing
	# deployments still start; set the variables and rotate these credentials.
	iface.launch(
	    auth=(
	        os.getenv("APP_AUTH_USERNAME", "gini"),
	        os.getenv("APP_AUTH_PASSWORD", "pick"),
	    )
	)