quickprep / app.py
ragul2607's picture
Update app.py
87d6326 verified
raw
history blame
712 Bytes
import asyncio
import functools
import os

import requests
from fastapi import FastAPI, Request, HTTPException
from pydantic import BaseModel
# ASGI application object; endpoints are attached to it with route decorators.
app = FastAPI()

# Hosted inference endpoint for the Meta-Llama-3-8B-Instruct model.
API_URL = "https://api-inference.huggingface.co/models/meta-llama/Meta-Llama-3-8B-Instruct"

# API token taken from the HF_API_KEY environment variable (None when unset).
HF_TOKEN = os.environ.get("HF_API_KEY")

# Authorization header attached to every upstream request.
# NOTE(review): when HF_API_KEY is unset the value becomes the literal
# "Bearer None" -- confirm the deployment always provides the variable.
headers = {"Authorization": f"Bearer {HF_TOKEN}"}
class PromptRequest(BaseModel):
    """JSON request body accepted by the ``/generate`` endpoint."""

    # Text that is forwarded to the model as the "inputs" field.
    prompt: str
# (connect, read) timeout in seconds for the upstream call, so a stalled
# inference request cannot hold a worker forever.
_UPSTREAM_TIMEOUT = (10, 120)


@app.post("/generate")
async def generate_text(data: PromptRequest):
    """Send the prompt to the Hugging Face Inference API and relay its reply.

    Args:
        data: Validated request body; ``data.prompt`` is posted upstream as
            the ``"inputs"`` field.

    Returns:
        The decoded JSON payload of the upstream response, unchanged.

    Raises:
        HTTPException: Status 500 with the error text as ``detail`` when the
            upstream call fails (connection error, timeout, non-2xx status)
            or the upstream body is not valid JSON.
    """
    # ``requests`` is a blocking client. Calling it directly inside a
    # coroutine would stall the event loop (and every other request) for the
    # whole upstream round trip, so it is pushed to the default thread pool.
    upstream_call = functools.partial(
        requests.post,
        API_URL,
        headers=headers,
        json={"inputs": data.prompt},
        timeout=_UPSTREAM_TIMEOUT,
    )
    try:
        loop = asyncio.get_running_loop()
        response = await loop.run_in_executor(None, upstream_call)
        response.raise_for_status()
        return response.json()
    except (requests.exceptions.RequestException, ValueError) as e:
        # RequestException covers network failures, timeouts and HTTP error
        # statuses; ValueError covers a non-JSON body on older ``requests``
        # releases. The 500 status and ``detail`` text are kept as before so
        # existing clients observe the same error responses.
        raise HTTPException(status_code=500, detail=str(e)) from e