Spaces: Running on Zero
Thanush committed · Commit f3b4260 · Parent(s): 01a984c
Refactor app.py to implement LangChain memory for enhanced conversation tracking. Update prompt building and response generation logic to utilize full conversation context, improving user interaction and medical assessment accuracy.
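For reference, a minimal, self-contained sketch of the LangChain ConversationBufferMemory calls this commit relies on (not part of the diff; the import path assumes the classic langchain package):

from langchain.memory import ConversationBufferMemory

# Buffer memory that keeps raw HumanMessage/AIMessage objects
memory = ConversationBufferMemory(return_messages=True)

# Record one user/assistant exchange
memory.save_context({"input": "I have a headache"},
                    {"output": "How long have you had it?"})

# Read the stored turns back; msg.type is "human" or "ai"
for msg in memory.chat_memory.messages:
    print(msg.type, "->", msg.content)

# Wipe the buffer when a new conversation starts
memory.clear()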
app.py CHANGED
@@ -68,7 +68,10 @@ meditron_model = AutoModelForCausalLM.from_pretrained(
 )
 print("Meditron model loaded successfully!")
 
-# …
+# Initialize LangChain memory for conversation tracking
+memory = ConversationBufferMemory(return_messages=True)
+
+# Simple state for basic info tracking
 conversation_state = {
     'name': None,
     'age': None,
@@ -95,13 +98,19 @@ def get_meditron_suggestions(patient_info):
     suggestion = meditron_tokenizer.decode(outputs[0][inputs.input_ids.shape[1]:], skip_special_tokens=True)
     return suggestion
 
-def build_simple_prompt(system_prompt, conversation_history, current_input):
-    """Build …
+def build_prompt_with_memory(system_prompt, current_input):
+    """Build prompt using LangChain memory for full conversation context"""
     prompt = f"<s>[INST] <<SYS>>\n{system_prompt}\n<</SYS>>\n\n"
 
-    # …
-    …
-    …
+    # Get conversation history from memory
+    messages = memory.chat_memory.messages
+
+    # Add conversation history to prompt
+    for msg in messages:
+        if msg.type == "human":
+            prompt += f"{msg.content} [/INST] "
+        elif msg.type == "ai":
+            prompt += f"{msg.content} </s><s>[INST] "
 
     # Add current input
     prompt += f"{current_input} [/INST] "
@@ -110,7 +119,7 @@ def build_simple_prompt(system_prompt, conversation_history, current_input):
 
 @spaces.GPU
 def generate_response(message, history):
-    """Generate a response using …
+    """Generate a response using LangChain ConversationBufferMemory."""
     global conversation_state
 
     # Reset state if this is a new conversation
@@ -122,35 +131,44 @@ def generate_response(message, history):
             'has_name': False,
            'has_age': False
         }
+        # Clear memory for new conversation
+        memory.clear()
+
+    # Save current user message to memory (we'll save bot response later)
+    memory.save_context({"input": message}, {"output": ""})
 
     # Step 1: Ask for name if not provided
     if not conversation_state['has_name']:
         conversation_state['has_name'] = True
-        …
+        bot_response = "Hello! Before we discuss your health concerns, could you please tell me your name?"
+        # Update memory with bot response
+        memory.save_context({"input": message}, {"output": bot_response})
+        return bot_response
 
     # Step 2: Store name and ask for age
     if conversation_state['name'] is None:
         conversation_state['name'] = message.strip()
-        …
+        bot_response = f"Nice to meet you, {conversation_state['name']}! Could you please tell me your age?"
+        # Update memory with bot response
+        memory.save_context({"input": message}, {"output": bot_response})
+        return bot_response
 
     # Step 3: Store age and start medical questions
     if not conversation_state['has_age']:
         conversation_state['age'] = message.strip()
         conversation_state['has_age'] = True
-        …
+        bot_response = f"Thank you, {conversation_state['name']}! Now, what brings you here today? Please tell me about any symptoms or health concerns you're experiencing."
+        # Update memory with bot response
+        memory.save_context({"input": message}, {"output": bot_response})
+        return bot_response
 
-    # Step 4: Medical consultation phase
+    # Step 4: Medical consultation phase using ConversationBufferMemory
     conversation_state['medical_turns'] += 1
 
-    # …
-    medical_history = []
-    if len(history) >= 3:  # Skip name/age exchanges
-        medical_history = history[3:]
-
-    # Build the prompt for medical consultation
+    # Build the prompt using memory for full conversation context
    if conversation_state['medical_turns'] <= 5:
         # Still gathering information - let LLM ask intelligent follow-up questions
-        prompt = …
+        prompt = build_prompt_with_memory(SYSTEM_PROMPT, message)
 
         # Generate response with intelligent follow-up questions
         inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
@@ -168,21 +186,31 @@ def generate_response(message, history):
         full_response = tokenizer.decode(outputs[0], skip_special_tokens=True)
         llama_response = full_response.split('[/INST]')[-1].strip()
 
+        # Save bot response to memory
+        memory.save_context({"input": message}, {"output": llama_response})
+
         return llama_response
 
     else:
         # Time for diagnosis and treatment (after 5+ turns)
-        # …
+        # Get all conversation messages from memory
+        all_messages = memory.chat_memory.messages
+
+        # Compile patient information from memory
         patient_info = f"Patient: {conversation_state['name']}, Age: {conversation_state['age']}\n\n"
-        patient_info += "…
+        patient_info += "Complete Conversation History:\n"
 
-        # Add all …
-        for …
-            …
-            …
+        # Add all messages from memory
+        for msg in all_messages:
+            if msg.type == "human":
+                patient_info += f"Patient: {msg.content}\n"
+            elif msg.type == "ai":
+                patient_info += f"Doctor: {msg.content}\n"
 
-        …
-        …
+        patient_info += f"Current: {message}\n"
+
+        # Generate diagnosis with full conversation context
+        diagnosis_prompt = f"<s>[INST] <<SYS>>\n{SYSTEM_PROMPT}\n<</SYS>>\n\nBased on the complete conversation history, please provide a comprehensive medical assessment including likely diagnosis and recommendations for {conversation_state['name']}.\n\nComplete Patient Information:\n{patient_info} [/INST] "
 
         inputs = tokenizer(diagnosis_prompt, return_tensors="pt").to(model.device)
         with torch.no_grad():
@@ -199,12 +227,15 @@ def generate_response(message, history):
         full_response = tokenizer.decode(outputs[0], skip_special_tokens=True)
         diagnosis = full_response.split('[/INST]')[-1].strip()
 
-        # Get treatment suggestions from Meditron
+        # Get treatment suggestions from Meditron using memory context
         treatment_suggestions = get_meditron_suggestions(patient_info)
 
         # Combine responses
         final_response = f"{diagnosis}\n\n--- TREATMENT RECOMMENDATIONS ---\n\n{treatment_suggestions}\n\n**Important:** These are general recommendations. Please consult with a healthcare professional for personalized medical advice."
 
+        # Save final response to memory
+        memory.save_context({"input": message}, {"output": final_response})
+
         return final_response
 
 # Create the Gradio interface
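For illustration, a rough usage sketch of the new prompt builder, showing the Llama-2 chat string it assembles from memory; the SYSTEM_PROMPT value here is a stand-in for the constant defined earlier in app.py:

from langchain.memory import ConversationBufferMemory

memory = ConversationBufferMemory(return_messages=True)
SYSTEM_PROMPT = "You are a medical assistant."  # stand-in; app.py defines the real system prompt

def build_prompt_with_memory(system_prompt, current_input):
    """Mirrors the diff: stored turns become alternating [INST] ... [/INST] blocks."""
    prompt = f"<s>[INST] <<SYS>>\n{system_prompt}\n<</SYS>>\n\n"
    for msg in memory.chat_memory.messages:
        if msg.type == "human":
            prompt += f"{msg.content} [/INST] "
        elif msg.type == "ai":
            prompt += f"{msg.content} </s><s>[INST] "
    prompt += f"{current_input} [/INST] "
    return prompt

# One prior exchange in memory, then a new user message
memory.save_context({"input": "My name is Alex"},
                    {"output": "Nice to meet you, Alex! Could you please tell me your age?"})
print(build_prompt_with_memory(SYSTEM_PROMPT, "I've had a fever for two days"))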