Futuresony committed on
Commit
52eb24f
·
verified ·
1 Parent(s): acf9986

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -23
app.py CHANGED
@@ -1,30 +1,19 @@
1
- import gradio as gr
2
- from huggingface_hub import InferenceClient
3
-
4
- client = InferenceClient("Futuresony/future_ai_12_10_2024.gguf")
5
-
6
  def respond(message, history, max_tokens, temperature, top_p):
7
- """Generates only a short, direct response without extra text."""
 
 
 
 
 
8
  response = client.text_generation(
9
  message.strip(),
10
  max_new_tokens=max_tokens,
11
  temperature=temperature,
12
  top_p=top_p,
13
- )
14
-
15
- # Remove "I am... ", "What do you do?", "Can you help me...?", etc.
16
- response = response.strip().split("\n")[0] # Keep only the first line
17
-
18
- yield response
19
-
20
- demo = gr.ChatInterface(
21
- respond,
22
- additional_inputs=[
23
- gr.Slider(minimum=1, maximum=250, value=128, step=1, label="Max new tokens"),
24
- gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
25
- gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)"),
26
- ],
27
- )
28
 
29
- if __name__ == "__main__":
30
- demo.launch()
 
 
 
 
 
 
1
  def respond(message, history, max_tokens, temperature, top_p):
2
+ """Generate a response while preventing unnecessary repetition."""
3
+
4
+ # Ensure the message isn't directly repeated
5
+ if history and message.strip() == history[-1][0].strip():
6
+ return "Tafadhali uliza swali tofauti." # Prevent direct repetition
7
+
8
  response = client.text_generation(
9
  message.strip(),
10
  max_new_tokens=max_tokens,
11
  temperature=temperature,
12
  top_p=top_p,
13
+ ).strip()
14
+
15
+ # Remove repeated input
16
+ if response.lower() == message.lower():
17
+ response = "Samahani, naweza kusaidia vipi?"
 
 
 
 
 
 
 
 
 
 
18
 
19
+ return response