chat / app.py
SimrusDenuvo's picture
Update app.py
57645e8 verified
raw
history blame
1.28 kB
from transformers import AutoTokenizer, AutoModelForCausalLM
import torch
import gradio as gr
# Hugging Face Hub identifier of the checkpoint used for generation.
model_name = "ai-forever/rugpt3large_based_on_gpt2"

# Both objects are created once at module load and reused by every request;
# the tokenizer is loaded first, then the model, from the same checkpoint.
tokenizer, model = (
    AutoTokenizer.from_pretrained(model_name),
    AutoModelForCausalLM.from_pretrained(model_name),
)
def generate_response(user_query):
    """Generate a bank-assistant style reply to a customer query.

    The query is wrapped in a two-line dialogue prompt ("Клиент: ..." followed
    by "Банк:") and the module-level ``model`` samples a continuation of at
    most 100 new tokens.

    Args:
        user_query: Text entered by the user.

    Returns:
        The sampled continuation with surrounding whitespace stripped, or an
        empty string when the query is empty or whitespace-only.
    """
    # Nothing to answer: skip the expensive sampling run entirely.
    if not user_query or not user_query.strip():
        return ""

    prompt = f"Клиент: {user_query}\nБанк:"

    # Calling the tokenizer (rather than ``encode``) also yields the attention
    # mask, which ``generate`` cannot infer reliably when the pad token id is
    # the same as the EOS token id.
    encoded = tokenizer(prompt, return_tensors="pt")
    prompt_ids = encoded["input_ids"]
    prompt_length = prompt_ids.shape[-1]

    with torch.no_grad():
        output_ids = model.generate(
            prompt_ids,
            attention_mask=encoded["attention_mask"],
            max_new_tokens=100,
            do_sample=True,
            temperature=0.7,
            top_k=50,
            top_p=0.95,
            pad_token_id=tokenizer.eos_token_id,
        )

    # Drop the prompt at the token level. Slicing the decoded text by
    # ``len(prompt)`` is fragile because decoding is not guaranteed to
    # reproduce the prompt character-for-character.
    new_token_ids = output_ids[0][prompt_length:]
    return tokenizer.decode(new_token_ids, skip_special_tokens=True).strip()
# Input widget: multi-line box where the user types the banking query.
query_box = gr.Textbox(lines=3, label="Введите банковский запрос")

# Output widget: multi-line box that shows the generated reply.
answer_box = gr.Textbox(lines=5, label="Ответ модели")

# Wire the generation function to the two text boxes.
demo = gr.Interface(
    fn=generate_response,
    inputs=query_box,
    outputs=answer_box,
    title="🤖 Русский банковский помощник",
    description="Генерация ответа на русском языке с использованием модели RuGPT-3 от AI-Forever.",
)

# Start the web UI as soon as the module runs; share=True asks Gradio for a
# public share link in addition to the local server.
demo.launch(share=True)