from transformers import pipeline
import gradio as gr
import torch
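
# Note: meta-llama/Meta-Llama-3-8B-Instruct is a gated model on the Hugging Face
# Hub; accept its license and authenticate first (e.g. `huggingface-cli login`).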
pipe = pipeline(
    "text-generation",
    model="meta-llama/Meta-Llama-3-8B-Instruct",
    torch_dtype=torch.float16,  # half precision to fit the 8B model in GPU memory
    device_map="auto",  # automatically uses the GPU if one is available
)
def chat(prompt):
    # Passing a list of messages makes the pipeline apply Llama 3's chat template.
    messages = [{"role": "user", "content": prompt}]
    result = pipe(messages, max_new_tokens=256, do_sample=True, temperature=0.7)
    # generated_text holds the whole conversation; the last message is the reply.
    return result[0]["generated_text"][-1]["content"]
demo = gr.Interface(fn=chat, inputs="text", outputs="text", title="Amside AI")
demo.launch()
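# Pass share=True to demo.launch() to get a temporary public URL if needed.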