# src/model_consumer.py
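"""Streamlit front end for a fine-tuned Phi-1.5 banking Q&A model.

Loads the merged model from the Hugging Face Hub once per session and
answers user questions submitted through a simple form.
"""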
import streamlit as st
from transformers import pipeline

# Model repo ID on the Hugging Face Hub
MODEL_ID = "prd101-wd/phi1_5-bankingqa-merged"

# Load the model only once and cache it across Streamlit reruns.
@st.cache_resource
def load_model():
    # Build a text-generation pipeline; trust_remote_code allows the Hub
    # repo to supply custom model code if the checkpoint requires it.
    return pipeline("text-generation", model=MODEL_ID, trust_remote_code=True)

pipe = load_model()
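# Note: no device is set above, so transformers defaults to CPU. On a GPU
# host you could pass device=0 (or device_map="auto" with accelerate) to
# pipeline(...) for faster inference.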
# Streamlit UI
st.title("Banking HelpDesk from Fine-tuned Phi-1.5")
st.markdown("Ask a question and the fine-tuned Phi-1.5 model will answer.")
user_input = st.text_area("Your question:", height=100)
if st.button("Ask"):
    if user_input.strip():
        # Format the prompt Alpaca-style to match the fine-tuning template.
        prompt = f"### Instruction:\n{user_input}\n\n### Response:\n"
        # Sample up to 200 new tokens with moderate randomness.
        output = pipe(prompt, max_new_tokens=200, do_sample=True, temperature=0.7)
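        # Alternative (not used in the original): passing
        # return_full_text=False to the pipeline call returns only the newly
        # generated tokens, which would make the "### Response:" split below
        # unnecessary.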
        # Process output: the pipeline returns a list of dicts,
        # each with a "generated_text" key.
        if isinstance(output, list) and output:
            answer = output[0]["generated_text"]
            # The generated text echoes the prompt; keep only the part
            # after the response marker.
            if "### Response:" in answer:
                answer = answer.split("### Response:")[-1].strip()
        else:
            answer = "Unable to generate a response. Please try again."
        st.markdown("### HelpdeskBot Answer:")
        st.success(answer)
    else:
        st.warning("Please enter a question.")
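
# To run locally (assumed entry point): streamlit run src/model_consumer.py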