Spaces:
Running
Running
import os

import gradio as gr
import requests
def talk_to_llama(prompt):
    """Send ``prompt`` as a single user message and return the model's reply.

    The API key is read from the ``NVIDIA_API_KEY`` environment variable so
    that no credential lives in the source file. Any key that was ever
    committed to the repository should be treated as compromised and revoked.

    Args:
        prompt: Text placed in the ``content`` field of the one user message.

    Returns:
        The ``content`` of the first choice's message in the JSON response.

    Raises:
        RuntimeError: If ``NVIDIA_API_KEY`` is unset or empty, or if the
            response JSON does not have the expected
            ``choices[0].message.content`` structure.
        requests.HTTPError: If the endpoint answers with a 4xx/5xx status.
        requests.RequestException: On connection failures or timeouts.
    """
    # Check the credential before doing any network work so a
    # misconfigured deployment fails immediately with an actionable message.
    api_key = os.environ.get("NVIDIA_API_KEY")
    if not api_key:
        raise RuntimeError(
            "NVIDIA_API_KEY environment variable is not set; "
            "configure it as a secret instead of hard-coding the key."
        )

    url = "https://api.nvcf.nvidia.com/v2/completions"
    headers = {
        "Authorization": f"Bearer {api_key}",
        "Content-Type": "application/json",
    }
    # NOTE(review): the payload carries no "model" field -- confirm that this
    # endpoint selects the model some other way.
    data = {
        "messages": [{"role": "user", "content": prompt}],
    }

    # Without a timeout, requests waits forever on a stalled connection.
    response = requests.post(url, headers=headers, json=data, timeout=60)
    # Surface HTTP errors directly rather than as a KeyError further down.
    response.raise_for_status()

    payload = response.json()
    try:
        return payload["choices"][0]["message"]["content"]
    except (KeyError, IndexError, TypeError) as err:
        raise RuntimeError(
            "Unexpected response structure from completions endpoint"
        ) from err
# Wrap talk_to_llama in a Gradio interface with one text input and one text
# output, then launch it.
chat = gr.Interface(
    fn=talk_to_llama,
    inputs="text",
    outputs="text",
    title="Chat with LLaMA 4 Scout",
)
chat.launch()