import streamlit as st
import requests
import matplotlib.pyplot as plt
from transformers import pipeline
import openai
import pandas as pd
import os
# Configure the OpenAI API key (read from the environment; do not hard-code secrets)
openai.api_key = os.getenv("OPENAI_API_KEY")
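# Note (deployment assumption): when this app runs on Hugging Face Spaces, OPENAI_API_KEY can
# typically be added under the Space's "Settings -> Variables and secrets", which exposes it to
# the app as an environment variable so the key never has to appear in the source.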
# ๋„ค์ด๋ฒ„ ๋‰ด์Šค API๋ฅผ ํ†ตํ•ด ์‹ค์ œ ๋‰ด์Šค ๊ธฐ์‚ฌ ๊ฐ€์ ธ์˜ค๊ธฐ
def fetch_naver_news(query, display=5):
client_id = "I_8koTJh3R5l4wLurQbG" # ๋„ค์ด๋ฒ„ ๊ฐœ๋ฐœ์ž ์„ผํ„ฐ์—์„œ ๋ฐœ๊ธ‰๋ฐ›์€ Client ID
client_secret = "W5oWYlAgur" # ๋„ค์ด๋ฒ„ ๊ฐœ๋ฐœ์ž ์„ผํ„ฐ์—์„œ ๋ฐœ๊ธ‰๋ฐ›์€ Client Secret
url = "https://openapi.naver.com/v1/search/news.json"
headers = {
"X-Naver-Client-Id": client_id,
"X-Naver-Client-Secret": client_secret,
}
params = {
"query": query,
"display": display,
"start": 1,
"sort": "date", # ์ตœ์‹ ์ˆœ์œผ๋กœ ์ •๋ ฌ
}
response = requests.get(url, headers=headers, params=params)
if response.status_code == 200:
news_data = response.json()
return news_data['items'] # ๋‰ด์Šค ๊ธฐ์‚ฌ ๋ฆฌ์ŠคํŠธ ๋ฐ˜ํ™˜
else:
st.error("๋‰ด์Šค ๋ฐ์ดํ„ฐ๋ฅผ ๋ถˆ๋Ÿฌ์˜ค๋Š” ๋ฐ ์‹คํŒจํ–ˆ์Šต๋‹ˆ๋‹ค.")
return []
# ์ •์น˜ ์„ฑํ–ฅ ๋ถ„์„ ๋ชจ๋ธ ๋กœ๋“œ
def load_sentiment_model():
classifier = pipeline("text-classification", model="bucketresearch/politicalBiasBERT")
return classifier
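# Note (suggestion, not part of the original code): reloading the Hugging Face pipeline on every
# Streamlit rerun is slow. If the installed Streamlit version provides st.cache_resource, the
# loader could be cached so the model is built only once per process, e.g.:
#
#   @st.cache_resource
#   def load_sentiment_model():
#       return pipeline("text-classification", model="bucketresearch/politicalBiasBERT")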
# Generate an article from the opposite viewpoint using GPT-4
def generate_article_gpt4(prompt):
    try:
        response = openai.ChatCompletion.create(
            model="gpt-4",
            messages=[
                {"role": "system", "content": "You are a helpful assistant that generates articles."},
                {"role": "user", "content": prompt}
            ],
            max_tokens=512,
            temperature=0.7
        )
        return response.choices[0].message.content
    except Exception as e:
        return f"Error generating text: {e}"
# Classify the political leaning of an article
def analyze_article_sentiment(text, classifier):
    result = classifier(text[:512])  # truncate very long text before classification
    label = result[0]["label"]
    score = result[0]["score"]

    # Map the model's labels to "์ง„๋ณด" (progressive), "๋ณด์ˆ˜" (conservative), "์ค‘๋ฆฝ" (neutral)
    if label == "LEFT":
        return "์ง„๋ณด", score
    elif label == "RIGHT":
        return "๋ณด์ˆ˜", score
    else:
        return "์ค‘๋ฆฝ", score
# ์ •์น˜์  ๊ด€์  ๋น„๊ต ๋ฐ ๋ฐ˜๋Œ€ ๊ด€์  ์ƒ์„ฑ
def analyze_news_political_viewpoint(query):
# ๋‰ด์Šค ๋ฐ์ดํ„ฐ ๊ฐ€์ ธ์˜ค๊ธฐ
news_items = fetch_naver_news(query)
if not news_items:
return [], {}
classifier = load_sentiment_model()
results = []
sentiment_counts = {"์ง„๋ณด": 0, "๋ณด์ˆ˜": 0, "์ค‘๋ฆฝ": 0} # ๋งคํ•‘๋œ ๋ผ๋ฒจ์— ๋งž๊ฒŒ ์ดˆ๊ธฐํ™”
for item in news_items:
title = item["title"]
description = item["description"]
combined_text = f"{title}. {description}"
# ๊ธฐ์‚ฌ ์„ฑํ–ฅ ๋ถ„์„
sentiment, score = analyze_article_sentiment(combined_text, classifier)
sentiment_counts[sentiment] += 1 # ๋งคํ•‘๋œ ํ‚ค๋กœ ์นด์šดํŠธ ์ฆ๊ฐ€
# ๋ฐ˜๋Œ€ ๊ด€์  ๊ธฐ์‚ฌ ์ƒ์„ฑ
opposite_perspective = "๋ณด์ˆ˜์ " if sentiment == "์ง„๋ณด" else "์ง„๋ณด์ "
prompt = f"{combined_text}๋ฅผ ๊ธฐ๋ฐ˜์œผ๋กœ {opposite_perspective} ๊ด€์ ์˜ ๊ธฐ์‚ฌ๋ฅผ ์ž‘์„ฑํ•ด์ฃผ์„ธ์š”."
opposite_article = generate_article_gpt4(prompt)
results.append({
"์ œ๋ชฉ": title,
"์›๋ณธ ๊ธฐ์‚ฌ": description,
"์„ฑํ–ฅ": sentiment,
"์„ฑํ–ฅ ์ ์ˆ˜": score,
"๋Œ€์กฐ ๊ด€์  ๊ธฐ์‚ฌ": opposite_article
})
return results, sentiment_counts
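# Note (suggestion): titles and descriptions returned by the Naver search API typically contain
# <b>...</b> highlight tags and HTML entities around matched terms. Stripping them before
# classification and display keeps both the model input and the UI clean, e.g.:
#
#   import html, re
#   def clean_naver_text(text):
#       return html.unescape(re.sub(r"</?b>", "", text))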
# ์„ฑํ–ฅ ๋ถ„ํฌ ์‹œ๊ฐํ™”
def visualize_sentiment_distribution(sentiment_counts):
fig, ax = plt.subplots()
labels = list(sentiment_counts.keys())
sizes = list(sentiment_counts.values())
ax.pie(sizes, labels=labels, autopct='%1.1f%%', startangle=90, colors=["blue", "red", "gray"])
ax.axis("equal")
st.pyplot(fig)
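# Note (assumption about the runtime environment): matplotlib's default fonts usually lack Hangul
# glyphs, so the Korean slice labels may render as empty boxes. If that happens, pointing
# matplotlib at an installed Korean font before plotting fixes it, e.g.:
#
#   plt.rcParams["font.family"] = "NanumGothic"  # hypothetical; any installed Korean font works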
# Streamlit application
st.title("์ •์น˜์  ๊ด€์  ๋น„๊ต ๋ถ„์„ ๋„๊ตฌ")
st.markdown("๋‰ด์Šค ๊ธฐ์‚ฌ์˜ ์ •์น˜ ์„ฑํ–ฅ ๋ถ„์„๊ณผ ๋ฐ˜๋Œ€ ๊ด€์  ๊ธฐ์‚ฌ๋ฅผ ์ƒ์„ฑํ•˜์—ฌ ๋น„๊ตํ•ฉ๋‹ˆ๋‹ค.")

query = st.text_input("๊ฒ€์ƒ‰ ํ‚ค์›Œ๋“œ๋ฅผ ์ž…๋ ฅํ•˜์„ธ์š”", value="์ •์น˜")

if st.button("๋ถ„์„ ์‹œ์ž‘"):
    with st.spinner("๋ถ„์„ ์ค‘..."):
        analysis_results, sentiment_counts = analyze_news_political_viewpoint(query)

    if analysis_results:
        st.success("๋‰ด์Šค ๋ถ„์„์ด ์™„๋ฃŒ๋˜์—ˆ์Šต๋‹ˆ๋‹ค.")

        # Visualize the political-leaning distribution
        st.subheader("์„ฑํ–ฅ ๋ถ„ํฌ ์‹œ๊ฐํ™”")
        visualize_sentiment_distribution(sentiment_counts)

        # Print the detailed analysis results
        st.subheader("์ƒ์„ธ ๋ถ„์„ ๊ฒฐ๊ณผ")
        for result in analysis_results:
            st.write(f"#### ์ œ๋ชฉ: {result['์ œ๋ชฉ']}")
            st.write(f"- **์›๋ณธ ๊ธฐ์‚ฌ**: {result['์›๋ณธ ๊ธฐ์‚ฌ']}")
            st.write(f"- **์„ฑํ–ฅ**: {result['์„ฑํ–ฅ']} (์ ์ˆ˜: {result['์„ฑํ–ฅ ์ ์ˆ˜']:.2f})")
            st.write(f"- **๋Œ€์กฐ ๊ด€์  ๊ธฐ์‚ฌ**: {result['๋Œ€์กฐ ๊ด€์  ๊ธฐ์‚ฌ']}")
            st.write("---")
    else:
        st.error("๋ถ„์„๋œ ๋‰ด์Šค ๋ฐ์ดํ„ฐ๊ฐ€ ์—†์Šต๋‹ˆ๋‹ค.")