Spaces:

SimrusDenuvo
/

chat

Sleeping

App Files Files Community

chat / app.py

SimrusDenuvo

Update app.py

d1231ce verified 4 months ago

raw

history blame

4.33 kB

	import gradio as gr
	import time
	from transformers import pipeline

	# Инициализация моделей (CPU-совместимые)
	models = {
	"ChatGPT-like": pipeline(
	"text-generation",
	model="IlyaGusev/saiga_mistral_7b_text",
	tokenizer="IlyaGusev/saiga_mistral_7b_text",
	device=-1
	),
	"DeepSeek-like": pipeline(
	"text-generation",
	model="deepseek-ai/DeepSeek-Coder-1.3B-instruct",
	tokenizer="deepseek-ai/DeepSeek-Coder-1.3B-instruct",
	device=-1
	),
	"GigaChat-like": pipeline(
	"text-generation",
	model="tinkoff-ai/ruGPT3Large",
	tokenizer="tinkoff-ai/ruGPT3Large",
	device=-1
	)
	}

	# Обычный промпт
	def build_simple_prompt(user_input):
	return f"Клиент: {user_input}\nКатегория обращения:"

	# Промпт с рассуждением
	def build_cot_prompt(user_input):
	return (
	f"Клиент: {user_input}\n"
	"Проанализируй обращение клиента пошагово:\n"
	"1. В чём проблема?\n"
	"2. Почему она возникла?\n"
	"3. Как это можно решить?\n"
	"Выведи итог: Категория обращения:"
	)

	# Генерация
	def generate_classification(user_input):
	prompt_simple = build_simple_prompt(user_input)
	prompt_cot = build_cot_prompt(user_input)

	results = {}

	for name, pipe in models.items():
	# CoT
	start_cot = time.time()
	cot_output = pipe(prompt_cot, max_new_tokens=150, do_sample=True, top_p=0.9, temperature=0.7)[0]["generated_text"]
	end_cot = round(time.time() - start_cot, 2)

	# Simple
	start_simple = time.time()
	simple_output = pipe(prompt_simple, max_new_tokens=80, do_sample=True, top_p=0.9, temperature=0.7)[0]["generated_text"]
	end_simple = round(time.time() - start_simple, 2)

	results[name] = {
	"cot_answer": cot_output.strip(),
	"cot_time": end_cot,
	"simple_answer": simple_output.strip(),
	"simple_time": end_simple
	}

	return (
	results["ChatGPT-like"]["cot_answer"], f"{results['ChatGPT-like']['cot_time']} сек",
	results["ChatGPT-like"]["simple_answer"], f"{results['ChatGPT-like']['simple_time']} сек",
	results["DeepSeek-like"]["cot_answer"], f"{results['DeepSeek-like']['cot_time']} сек",
	results["DeepSeek-like"]["simple_answer"], f"{results['DeepSeek-like']['simple_time']} сек",
	results["GigaChat-like"]["cot_answer"], f"{results['GigaChat-like']['cot_time']} сек",
	results["GigaChat-like"]["simple_answer"], f"{results['GigaChat-like']['simple_time']} сек"
	)

	# Gradio интерфейс
	with gr.Blocks() as demo:
	gr.Markdown("## 🧠 Сравнение моделей (ChatGPT, DeepSeek, GigaChat) по классификации клиентских обращений")

	inp = gr.Textbox(label="Вопрос клиента", placeholder="Например: Я не могу перевести деньги", lines=2)
	btn = gr.Button("Сгенерировать")

	# ChatGPT-like
	gr.Markdown("### ChatGPT-like (Saiga Mistral)")
	cot1 = gr.Textbox(label="CoT ответ")
	cot1_time = gr.Textbox(label="Время CoT")
	simple1 = gr.Textbox(label="Обычный ответ")
	simple1_time = gr.Textbox(label="Время обычного")

	# DeepSeek-like
	gr.Markdown("### DeepSeek-like")
	cot2 = gr.Textbox(label="CoT ответ")
	cot2_time = gr.Textbox(label="Время CoT")
	simple2 = gr.Textbox(label="Обычный ответ")
	simple2_time = gr.Textbox(label="Время обычного")

	# GigaChat-like
	gr.Markdown("### GigaChat-like (ruGPT3Large)")
	cot3 = gr.Textbox(label="CoT ответ")
	cot3_time = gr.Textbox(label="Время CoT")
	simple3 = gr.Textbox(label="Обычный ответ")
	simple3_time = gr.Textbox(label="Время обычного")

	btn.click(generate_classification, inputs=[inp], outputs=[
	cot1, cot1_time, simple1, simple1_time,
	cot2, cot2_time, simple2, simple2_time,
	cot3, cot3_time, simple3, simple3_time
	])

	demo.launch()