# Jintonic92's picture
# Update app.py
# 8181918 verified
# raw
# history blame
# 24.3 kB
import streamlit as st
import pandas as pd
import os
from src.SecondModule.module2 import SimilarQuestionGenerator
from src.ThirdModule.module3 import AnswerVerifier
import logging
from typing import Optional, Tuple
# Configure root logging at DEBUG level before anything else logs.
logging.basicConfig(level=logging.DEBUG)
# Basic Streamlit page configuration (title, wide layout, sidebar expanded).
st.set_page_config(
    page_title="MisconcepTutor",
    layout="wide",
    initial_sidebar_state="expanded"
)
@st.cache_resource
def load_answer_verifier():
    """Create the answer-verification model.

    Wrapped in ``st.cache_resource`` so the instance is built once and then
    shared between reruns instead of being constructed on every call.

    Returns:
        A new ``AnswerVerifier`` instance (constructed with no arguments).
    """
    from src.ThirdModule.module3 import AnswerVerifier as _VerifierClass

    verifier = _VerifierClass()
    return verifier
# Path configuration: data files are looked up in the "Data" directory that
# sits next to this script.
base_path = os.path.dirname(os.path.abspath(__file__))
data_path = os.path.join(base_path, 'Data')
misconception_csv_path = os.path.join(data_path, 'misconception_mapping.csv')
# Logging configuration.
# NOTE(review): logging.basicConfig(level=logging.DEBUG) is already called near
# the top of this file; a second basicConfig call normally does nothing once
# the root logger has handlers, so this INFO level is probably not applied —
# confirm which level is intended.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# Session-state initialisation. Kept at module level, ahead of the function
# definitions that read these keys, so that it runs first on every script run.
# The 'initialized' marker makes sure the defaults are written only once per
# session (or again after the state has been cleared).
if 'initialized' not in st.session_state:
    st.session_state.update({
        'initialized': True,
        'wrong_questions': [],
        'misconceptions': [],
        'current_question_index': 0,
        'generated_questions': [],
        'current_step': 'initial',
        'selected_wrong_answer': None,
        'questions': [],
    })
    logger.info("Session state initialized")
# Question generator initialisation.
@st.cache_resource
def load_question_generator():
    """Create the similar-question generator backed by the misconception CSV.

    Wrapped in ``st.cache_resource`` so the generator is built once and reused.

    Returns:
        A ``SimilarQuestionGenerator`` constructed with
        ``misconception_csv_path``.

    Raises:
        FileNotFoundError: If the misconception CSV does not exist. The same
            message is also shown in the UI via ``st.error`` before raising.
    """
    csv_is_present = os.path.exists(misconception_csv_path)
    if csv_is_present:
        return SimilarQuestionGenerator(misconception_csv_path=misconception_csv_path)

    message = f"CSV 파일이 μ‘΄μž¬ν•˜μ§€ μ•ŠμŠ΅λ‹ˆλ‹€: {misconception_csv_path}"
    st.error(message)
    raise FileNotFoundError(message)
# CSV data loading.
@st.cache_data
def load_data(data_file = '/train.csv'):
    """Read a CSV file from the data directory into a DataFrame.

    Args:
        data_file: File name relative to ``data_path``. Leading ``/``
            characters are stripped before the path is joined.

    Returns:
        The loaded ``pandas.DataFrame``, or ``None`` when the file does not
        exist (the problem is reported through ``st.error`` and the logger).
    """
    relative_name = data_file.lstrip('/')
    file_path = os.path.join(data_path, relative_name)
    try:
        frame = pd.read_csv(file_path)
    except FileNotFoundError:
        st.error(f"νŒŒμΌμ„ 찾을 수 μ—†μŠ΅λ‹ˆλ‹€: {data_file}")
        logger.error(f"File not found: {data_file}")
        return None
    logger.info(f"Data loaded successfully from {file_path}")
    return frame
def start_quiz():
    """Start a quiz: draw the question set and reset the progress state.

    Loads the data set through ``load_data``; when nothing usable comes back an
    error is shown and the session state is left untouched. Otherwise ten rows
    are sampled (fixed ``random_state=42``), the step is switched to ``'quiz'``
    and the per-quiz bookkeeping lists and index are reset.
    """
    df = load_data()
    if df is None or df.empty:
        st.error("데이터λ₯Ό 뢈러올 수 μ—†μŠ΅λ‹ˆλ‹€. 데이터셋을 ν™•μΈν•΄μ£Όμ„Έμš”.")
        return

    state = st.session_state
    state.questions = df.sample(n=10, random_state=42)
    state.current_step = 'quiz'
    state.current_question_index = 0
    # Each list gets its own fresh object.
    for list_name in ('wrong_questions', 'misconceptions', 'generated_questions'):
        state[list_name] = []
    logger.info("Quiz started")
def generate_similar_question(wrong_q, misconception_id, generator):
    """Generate a question similar to one the user answered incorrectly.

    Args:
        wrong_q: Dict describing the wrongly answered question. The keys read
            here are ``ConstructName``, ``SubjectName``, ``QuestionText``,
            ``CorrectAnswer`` and the ``Answer<letter>Text`` entries.
        misconception_id: Misconception id tied to the wrong answer. When it is
            NaN/None, the most recent non-NaN id stored in
            ``st.session_state.misconceptions`` is used, falling back to 2001.
        generator: Object exposing ``generate_similar_question_with_text``.

    Returns:
        A dict with ``question``, ``choices``, ``correct`` and ``explanation``,
        or ``None`` when the input is not a dict, nothing was generated, or any
        exception was raised (errors are logged and shown with ``st.error``).

    Side effects:
        Stores the answer that is finally used in
        ``st.session_state['current_similar_question_answer']``.

    NOTE(review): the wrong-answer text is looked up with
    ``st.session_state.selected_wrong_answer``, i.e. the most recently selected
    wrong answer, not necessarily the one given for ``wrong_q`` — confirm that
    this is intended.
    """
    logger.info(f"Generating similar question for misconception_id: {misconception_id}")

    # Validate the input before doing any work.
    if not isinstance(wrong_q, dict):
        logger.error(f"Invalid wrong_q type: {type(wrong_q)}")
        st.error("μœ μ‚¬ 문제 생성에 ν•„μš”ν•œ 데이터 ν˜•μ‹μ΄ 잘λͺ»λ˜μ—ˆμŠ΅λ‹ˆλ‹€.")
        return None

    try:
        # No usable misconception id: fall back to another one.
        if pd.isna(misconception_id):
            logger.info("Original misconception_id is NaN, trying to find alternative")
            # Candidates are the ids collected so far in this session.
            usable_ids = [m for m in st.session_state.misconceptions if not pd.isna(m)]
            if usable_ids:
                # Take the most recently recorded one.
                misconception_id = usable_ids[-1]
                logger.info(f"Using alternative misconception_id: {misconception_id}")
            else:
                # TODO: replace 2001 with a properly chosen default id.
                misconception_id = 2001
                logger.info(f"Using default misconception_id: {misconception_id}")

        # Prepare plain string/int arguments (guards against tuple conversion).
        correct_key = f'Answer{wrong_q["CorrectAnswer"]}Text'
        wrong_key = f'Answer{st.session_state.selected_wrong_answer}Text'
        input_data = {
            'construct_name': str(wrong_q.get('ConstructName', '')),
            'subject_name': str(wrong_q.get('SubjectName', '')),
            'question_text': str(wrong_q.get('QuestionText', '')),
            'correct_answer_text': str(wrong_q.get(correct_key, '')),
            'wrong_answer_text': str(wrong_q.get(wrong_key, '')),
            'misconception_id': int(misconception_id)
        }
        logger.info(f"Prepared input data: {input_data}")

        with st.spinner("πŸ“ μœ μ‚¬ 문제λ₯Ό μƒμ„±ν•˜κ³  μžˆμŠ΅λ‹ˆλ‹€..."):
            # The dict keys match the generator's keyword arguments one to one.
            generated_q, _ = generator.generate_similar_question_with_text(**input_data)

        if not generated_q:
            return None

        verifier = load_answer_verifier()
        with st.status("πŸ€” AIκ°€ 문제λ₯Ό κ²€ν† ν•˜κ³  μžˆμŠ΅λ‹ˆλ‹€..."):
            st.write("λ‹΅μ•ˆμ˜ 정확성을 κ²€μ¦ν•˜κ³  μžˆμŠ΅λ‹ˆλ‹€...")
            verified_answer = verifier.verify_answer(
                question=generated_q.question,
                choices=generated_q.choices
            )
            if verified_answer:
                logger.info(f"Answer verified: {verified_answer}")
                st.write("βœ… 검증 μ™„λ£Œ!")
                final_answer = verified_answer
            else:
                # Verification gave nothing: keep the generator's own answer.
                logger.warning("Answer verification failed, using original answer")
                st.write("⚠️ 검증에 μ‹€νŒ¨ν–ˆμŠ΅λ‹ˆλ‹€. 원본 λ‹΅μ•ˆμ„ μ‚¬μš©ν•©λ‹ˆλ‹€.")
                final_answer = generated_q.correct_answer

            result = {
                'question': generated_q.question,
                'choices': generated_q.choices,
                'correct': final_answer,
                'explanation': generated_q.explanation
            }
            st.session_state['current_similar_question_answer'] = final_answer
            return result
    except Exception as e:
        logger.error(f"Error in generate_similar_question: {str(e)}")
        st.error(f"문제 생성 쀑 였λ₯˜κ°€ λ°œμƒν–ˆμŠ΅λ‹ˆλ‹€: {str(e)}")
        return None
def handle_answer(answer, current_q):
    """Record the user's answer and advance the quiz.

    Args:
        answer: The chosen option letter (compared with
            ``current_q['CorrectAnswer']``).
        current_q: The current question row; must support ``[]``, ``.get`` and
            ``.to_dict()``.

    A wrong answer stores the question (as a dict), the chosen letter and the
    matching ``Misconception<letter>Id`` value in the session state. In every
    case the question index is incremented, and once it reaches 10 the step is
    switched to ``'review'``.
    """
    state = st.session_state
    answered_wrong = answer != current_q['CorrectAnswer']
    if answered_wrong:
        state.wrong_questions.append(current_q.to_dict())
        state.selected_wrong_answer = answer
        state.misconceptions.append(current_q.get(f'Misconception{answer}Id'))

    state.current_question_index += 1
    quiz_finished = state.current_question_index >= 10
    if quiz_finished:
        state.current_step = 'review'
def format_latex_expression(text: str) -> str:
    """Convert a math expression string into LaTeX markup.

    Steps, applied in this order:
      1. ``\\(`` / ``\\)`` become ``\\left(`` / ``\\right)``.
      2. The phrases 'decimalplaces', 'rounded to' and 'What is' are wrapped
         in ``\\text{...}``.
      3. ``$(`` and ``)$`` become an escaped dollar plus a sized parenthesis.
      4. Doubled backslashes in front of ``div``, ``ldots``, ``dots`` and
         ``times`` are collapsed to a single backslash.
      5. Parentheses containing only digits, dots and whitespace are turned
         into ``\\left( ... \\right)``.
      6. The result is wrapped in ``$$ ... $$`` only when it neither starts
         nor ends with ``$``.

    Args:
        text: The raw expression.

    Returns:
        The converted string.
    """
    import re

    # Phrases that are shown as plain text inside the formula.
    text_phrases = ('decimalplaces', 'rounded to', 'What is')
    # (doubled-backslash form, single-backslash form) pairs.
    command_fixes = (
        (r'\\div', '\\div'),
        (r'\\ldots', '\\ldots'),
        (r'\\dots', '\\dots'),
        (r'\\times', '\\times'),
    )

    # Pre-processing of inline-math delimiters.
    text = text.replace('\\(', '\\left(').replace('\\)', '\\right)')

    for phrase in text_phrases:
        text = text.replace(phrase, f'\\text{{{phrase}}}')

    # Dollar signs directly attached to parentheses.
    text = text.replace('$(', '\\$\\left(').replace(')$', '\\right)\\$')

    for doubled, single in command_fixes:
        text = text.replace(doubled, single)

    # Purely numeric parenthesised groups get sized parentheses.
    text = re.sub(
        r'\(([\d\.\s]+)\)',
        lambda found: f'\\left({found.group(1)}\\right)',
        text,
    )

    # Wrap as display math unless a '$' already sits at either end.
    if not text.startswith('$') and not text.endswith('$'):
        text = f'$${text}$$'
    return text
def format_question(question: str) -> str:
    """Convert question text into LaTeX markup.

    The body of every ``\\textcolor{<color>}{<text>}`` occurrence is passed
    through ``format_latex_expression`` first, then the whole question is
    passed through ``format_latex_expression`` as well.

    Args:
        question: The raw question text.

    Returns:
        The converted question text.
    """
    # `re` is not imported at module level in this file, so import it here;
    # without this the function raised NameError on its first use.
    import re

    # Coloured text: \textcolor{color}{text}
    colored_text_pattern = r'\\textcolor{([^}]+)}{([^}]+)}'

    def process_colored_text(match):
        color = match.group(1)
        text = match.group(2)
        # NOTE(review): format_latex_expression may wrap `text` in $$...$$,
        # which then ends up nested inside the outer expression — confirm
        # that this renders as intended.
        return f'\\textcolor{{{color}}}{{{format_latex_expression(text)}}}'

    question = re.sub(colored_text_pattern, process_colored_text, question)
    return format_latex_expression(question)
def format_answer_choice(choice: str) -> str:
    """Convert an answer-choice string into LaTeX markup.

    Dollar signs in the choice are escaped as ``\\$`` before the text is handed
    to ``format_latex_expression``.

    Args:
        choice: The raw answer-choice text.

    Returns:
        The converted answer-choice text.
    """
    # Choices that contain a dollar sign need it escaped for LaTeX.
    escaped = choice.replace('$', '\\$') if '$' in choice else choice
    return format_latex_expression(escaped)
def display_math_content(content: str, is_question: bool = True) -> Optional[str]:
    """Format math content (a question or an answer choice) for display.

    Args:
        content: The raw text to format.
        is_question: When true the formatted text is rendered immediately with
            ``st.markdown``; otherwise it is handed back to the caller.

    Returns:
        ``None`` for questions (they are rendered directly), the formatted
        string for answer choices.
    """
    # The previous call target, format_math_expression, is not defined in this
    # file (NameError at call time); format_latex_expression is the formatter
    # this module actually provides.
    formatted_content = format_latex_expression(content)
    if is_question:
        st.markdown(formatted_content)
        return None
    # Answer choices may need further formatting by the caller.
    return formatted_content
def _forget_similar_questions():
    """Remove every per-tab similar-question entry from the session state.

    Used before a new question set starts, so that a similar question cached
    for tab *i* of the previous review is not shown for an unrelated question.
    """
    prefixes = (
        "show_similar_question_",
        "similar_question_answered_",
        "similar_question_data_",
        "selected_answer_",
        "is_correct_",
    )
    stale_keys = [
        key for key in st.session_state.keys()
        if isinstance(key, str) and key.startswith(prefixes)
    ]
    for key in stale_keys:
        del st.session_state[key]


def _pick_choice(labels, key_for):
    """Render the four answer buttons and return the clicked letter, if any.

    A and C are placed in the left column, B and D in the right one.

    Args:
        labels: Mapping from option letter ('A'..'D') to its display text.
        key_for: Callable returning the widget key for an option letter.

    Returns:
        The letter whose button was clicked in this run, or ``None``.
    """
    picked = None
    left, right = st.columns(2)
    for column, letters in ((left, ('A', 'C')), (right, ('B', 'D'))):
        with column:
            for letter in letters:
                if st.button(f"{letter}) {labels[letter]}", key=key_for(letter)):
                    picked = letter
    return picked


def _bottom_padding():
    """Add empty space at the bottom of the page."""
    st.markdown("<br>" * 5, unsafe_allow_html=True)
    st.markdown(
        "\n<div style=\"height: 100px;\">\n</div>\n",
        unsafe_allow_html=True,
    )


def _render_quiz():
    """Show the current quiz question with its four answer buttons."""
    index = st.session_state.current_question_index
    current_q = st.session_state.questions.iloc[index]

    # Progress indicator.
    st.progress(index / 10)
    st.write(f"### 문제 {index + 1}/10")

    # Question text. display_math_question / format_math_expression, which
    # were called here before, are not defined in this file, so the formatter
    # that does exist is used directly.
    st.markdown("---")
    st.markdown(format_latex_expression(str(current_q['QuestionText'])))

    # Answer choices.
    labels = {
        letter: format_latex_expression(str(current_q[f'Answer{letter}Text']))
        for letter in 'ABCD'
    }
    picked = _pick_choice(labels, lambda letter: letter)
    if picked is not None:
        handle_answer(picked, current_q)
        st.rerun()


def _render_similar_question(i, wrong_q, misconception_id, generator):
    """Show the similar question belonging to wrong-question tab ``i``.

    The generated question is cached in the session state under
    ``similar_question_data_<i>``. Without the cache every rerun (for example
    the one triggered by clicking an answer) would generate a different
    question, so the feedback and explanation would no longer match what the
    user answered.
    """
    show_key = f"show_similar_question_{i}"
    answered_key = f"similar_question_answered_{i}"
    data_key = f"similar_question_data_{i}"

    st.divider()
    new_question = st.session_state.get(data_key)
    if new_question is None:
        new_question = generate_similar_question(wrong_q, misconception_id, generator)
        if new_question:
            st.session_state[data_key] = new_question

    if not new_question:
        st.error("μœ μ‚¬ 문제λ₯Ό 생성할 수 μ—†μŠ΅λ‹ˆλ‹€.")
        if st.button("❌ λ‹«κΈ°", key=f"close_error_{i}"):
            st.session_state[show_key] = False
            st.rerun()
        return

    # Use the answer stored with this question rather than the shared
    # 'current_similar_question_answer' key, which other tabs overwrite.
    correct_answer = new_question['correct']

    st.write("### 🎯 μœ μ‚¬ 문제")
    st.markdown(format_latex_expression(str(new_question['question'])))

    # Whether this question has been answered already.
    answered = st.session_state.get(answered_key, False)

    st.write("**보기:**")
    if not answered:
        # Buttons are only offered while the question is unanswered.
        labels = {
            letter: format_latex_expression(str(new_question['choices'][letter]))
            for letter in 'ABCD'
        }
        picked = _pick_choice(labels, lambda letter: f"similar_{letter}_{i}")
        if picked is not None:
            st.session_state[answered_key] = True
            st.session_state[f"selected_answer_{i}"] = picked
            st.session_state[f"is_correct_{i}"] = picked == correct_answer
            st.rerun()
    else:
        # Result of the answer.
        if st.session_state.get(f"is_correct_{i}", False):
            st.success("βœ… μ •λ‹΅μž…λ‹ˆλ‹€!")
        else:
            st.error(f"❌ ν‹€λ ΈμŠ΅λ‹ˆλ‹€. 정닡은 {correct_answer}μž…λ‹ˆλ‹€.")
        # Explanation.
        st.write("---")
        st.write("**πŸ“ ν•΄μ„€:**", new_question['explanation'])
        # "Try again": same question, answer state reset.
        if st.button("πŸ”„ λ‹€μ‹œ ν’€κΈ°", key=f"reset_{i}"):
            st.session_state[answered_key] = False
            st.session_state[f"selected_answer_{i}"] = None
            st.session_state[f"is_correct_{i}"] = None
            st.rerun()

    # "Close question": hide it and drop the cached question.
    if st.button("❌ 문제 λ‹«κΈ°", key=f"close_{i}"):
        st.session_state[show_key] = False
        st.session_state[answered_key] = False
        st.session_state[f"selected_answer_{i}"] = None
        st.session_state[f"is_correct_{i}"] = None
        if data_key in st.session_state:
            del st.session_state[data_key]
        st.rerun()

    _bottom_padding()


def _render_wrong_question_tab(i, wrong_q, misconception_id, generator):
    """Show one wrongly answered question, its misconception and the retry UI."""
    st.write("**πŸ“‹ 문제:**")
    st.write(wrong_q['QuestionText'])
    st.write("**βœ… μ •λ‹΅:**", wrong_q['CorrectAnswer'])
    st.write("---")
    st.write("**πŸ” κ΄€λ ¨λœ Misconception:**")
    if misconception_id and not pd.isna(misconception_id):
        misconception_text = generator.get_misconception_text(misconception_id)
        st.info(f"Misconception ID: {int(misconception_id)}\n\n{misconception_text}")
    else:
        st.info("Misconception 정보가 μ—†μŠ΅λ‹ˆλ‹€.")

    show_key = f"show_similar_question_{i}"
    if st.button(f"πŸ“š μœ μ‚¬ 문제 ν’€κΈ°", key=f"retry_{i}"):
        st.session_state[show_key] = True
        st.session_state[f"similar_question_answered_{i}"] = False
        # An explicit request always gets a freshly generated question.
        data_key = f"similar_question_data_{i}"
        if data_key in st.session_state:
            del st.session_state[data_key]
        st.rerun()

    if st.session_state.get(show_key, False):
        _render_similar_question(i, wrong_q, misconception_id, generator)


def _render_review(generator):
    """Show the result statistics, navigation and wrong-question analysis."""
    wrong_questions = st.session_state.wrong_questions
    wrong_count = len(wrong_questions)

    st.write("### ν•™μŠ΅ κ²°κ³Ό")

    # Result statistics.
    total_col, right_col, wrong_col = st.columns(3)
    total_col.metric("총 문제 수", 10)
    right_col.metric("λ§žμ€ 문제", 10 - wrong_count)
    wrong_col.metric("ν‹€λ¦° 문제", wrong_count)

    # Message depending on the result.
    if wrong_count == 0:
        st.balloons()  # celebration effect
        st.success("πŸŽ‰ μΆ•ν•˜ν•©λ‹ˆλ‹€! λͺ¨λ“  문제λ₯Ό λ§žμΆ”μ…¨μ–΄μš”!")
        st.markdown(
            "\n"
            "### πŸ† μˆ˜ν•™μ™•μ΄μ‹­λ‹ˆλ‹€!\n"
            "μ™„λ²½ν•œ 점수λ₯Ό λ°›μœΌμ…¨λ„€μš”! μˆ˜ν•™μ  κ°œλ…μ„ μ •ν™•ν•˜κ²Œ μ΄ν•΄ν•˜κ³  계신 것 κ°™μŠ΅λ‹ˆλ‹€.\n"
        )
    elif wrong_count <= 3:
        st.success("잘 ν•˜μ…¨μ–΄μš”! 쑰금만 더 μ—°μŠ΅ν•˜λ©΄ μ™„λ²½ν•  κ±°μ˜ˆμš”!")
    else:
        st.info("천천히 κ°œλ…μ„ λ³΅μŠ΅ν•΄λ³΄μ•„μš”. μ—°μŠ΅ν•˜λ‹€ 보면 λŠ˜μ–΄λ‚  κ±°μ˜ˆμš”!")

    # Navigation buttons.
    restart_col, home_col = st.columns(2)
    with restart_col:
        if st.button("πŸ”„ μƒˆλ‘œμš΄ 문제 μ„ΈνŠΈ μ‹œμž‘ν•˜κΈ°", use_container_width=True):
            # Per-tab state of this review must not leak into the next one.
            _forget_similar_questions()
            start_quiz()
            st.rerun()
    with home_col:
        if st.button("🏠 처음으둜 λŒμ•„κ°€κΈ°", use_container_width=True):
            st.session_state.clear()
            st.rerun()

    # Wrong-question analysis.
    if not wrong_questions:
        return
    st.write("### ✍️ ν‹€λ¦° 문제 뢄석")
    tabs = st.tabs([f"πŸ“ ν‹€λ¦° 문제 #{i + 1}" for i in range(wrong_count)])
    answered_pairs = zip(wrong_questions, st.session_state.misconceptions)
    for i, (tab, (wrong_q, misconception_id)) in enumerate(zip(tabs, answered_pairs)):
        with tab:
            _render_wrong_question_tab(i, wrong_q, misconception_id, generator)

    _bottom_padding()


def main():
    """Main application logic.

    Renders the screen that matches ``st.session_state.current_step``:
    ``'initial'`` (start button), ``'quiz'`` (current question) or
    ``'review'`` (results and wrong-question analysis).
    """
    st.title("MisconcepTutor")

    # Generator initialisation.
    generator = load_question_generator()

    step = st.session_state.current_step
    if step == 'initial':
        # Start screen.
        st.write("#### ν•™μŠ΅μ„ μ‹œμž‘ν•˜κ² μŠ΅λ‹ˆλ‹€. 10개의 문제λ₯Ό ν’€μ–΄λ³ΌκΉŒμš”?")
        if st.button("ν•™μŠ΅ μ‹œμž‘", key="start_quiz"):
            start_quiz()
            st.rerun()
    elif step == 'quiz':
        _render_quiz()
    elif step == 'review':
        _render_review(generator)
# Script entry point.
if __name__ == "__main__":
    main()
# Correct answers with random_state 42:
# D C A A C
# A B B B B