Spaces:

Triok1
/

metaGenerator

Sleeping

App Files Files Community

Triok1 committed on May 11

Commit

05c8c2e

verified ·

1 Parent(s): 82152ba

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -67

app.py CHANGED Viewed

@@ -1,73 +1,39 @@
-from transformers import AutoTokenizer, T5ForConditionalGeneration
-import torch
 import gradio as gr
-import re
-tokenizer = AutoTokenizer.from_pretrained("cointegrated/rut5-base-multitask", legacy=False)
-model = T5ForConditionalGeneration.from_pretrained("cointegrated/rut5-base-multitask")
-def smart_truncate(text, max_len):
-    if len(text) <= max_len:
-        return text
-    return text[:text[:max_len+1].rfind(' ')].strip()
-def generate_meta(description):
-    # Очищаем входное описание
-    description = description.strip()
-    # Теперь безопасный f-string без .strip() внутри
-    prompt = """
-Create a title and description for product page.
-Product name: Fenix ARB-L18-4000U
-Description: {description}
-Output format:
-{{"title": "SEO заголовок до 60 символов", "description": "SEO описание до 160 символов"}}
-""".format(description=description)
     inputs = tokenizer(prompt, return_tensors="pt", max_length=512, truncation=True)
-    with torch.no_grad():
-        outputs = model.generate(
-            **inputs,
-            max_new_tokens=200,
-            num_beams=5,
-            early_stopping=True,
-            no_repeat_ngram_size=2
-        )
-    try:
-        result = tokenizer.decode(outputs[0], skip_special_tokens=True)
-        json_match = re.search(r'\{.*\}', result, re.DOTALL)
-        if json_match:
-            json_data = json.loads(json_match.group())
-            title = smart_truncate(json_data.get("title", ""), 60)
-            desc = smart_truncate(json_data.get("description", ""), 160)
-        else:
-            clean_text = re.sub(r'\s+', ' ', description)
-            title = smart_truncate(f"Аккумулятор Fenix {clean_text}", 60)
-            desc = smart_truncate(clean_text, 160)
-    except Exception as e:
-        clean_text = re.sub(r'\s+', ' ', description)
-        title = smart_truncate(f"Аккумулятор Fenix {clean_text}", 60)
-        desc = smart_truncate(clean_text, 160)
-    return title, desc
-# Интерфейс
-with gr.Blocks() as app:
-    gr.Markdown("## Генератор метатегов (контроль длины)")
-    inp = gr.Textbox(label="Описание товара", lines=7)
-    btn = gr.Button("Сгенерировать")
-    with gr.Row():
-        out_title = gr.Textbox(label="Title (до 60)", interactive=False)
-        out_desc = gr.Textbox(label="Description (до 160)", lines=3, interactive=False)
-    btn.click(fn=generate_meta, inputs=inp, outputs=[out_title, out_desc])
-app.launch()

 import gradio as gr
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
+# Load the summarization model and its tokenizer at module level so each call reuses them.
+model_name = "cointegrated/rut5-base-summarization"
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
+def generate_meta_description(product_description):
+    prompt = f"Сгенерируй meta description (до 160 символов) по следующему описанию товара: {product_description}"
     inputs = tokenizer(prompt, return_tensors="pt", max_length=512, truncation=True)
+    summary_ids = model.generate(
+        inputs["input_ids"],
+        max_length=60,  # приблизительно ~160 символов на русском
+        num_beams=4,
+        no_repeat_ngram_size=2,
+        early_stopping=True
+    )
+    summary = tokenizer.decode(summary_ids[0], skip_special_tokens=True)
+    # обрезаем аккуратно, чтобы не обрывать слова
+    if len(summary) > 160:
+        truncated = summary[:160]
+        last_space = truncated.rfind(' ')
+        summary = truncated[:last_space]
+    return summary.strip()
+iface = gr.Interface(  # One-textbox-in, one-textbox-out UI around generate_meta_description.
+    fn=generate_meta_description,
+    inputs=gr.Textbox(label="Описание товара", lines=5, placeholder="Например: Красивое мужское пальто из шерсти..."),
+    outputs=gr.Textbox(label="Meta Description (до 160 символов)"),
+    title="Meta Description генератор (русский)",
+    description="Генерирует логичный и краткий meta description по описанию товара (до 160 символов, без обрезания слов)."
+)
+if __name__ == "__main__":  # Start the web UI only when run as a script, not on import.
+    iface.launch()