|
import os

import requests
from fastapi import FastAPI, HTTPException, Request
from fastapi.concurrency import run_in_threadpool
|
|
|
# ASGI application object; the route handlers in this module register on it.
app = FastAPI()

# Hugging Face Inference API endpoint for the hosted Llama 3 8B Instruct model.
API_URL = "https://api-inference.huggingface.co/models/meta-llama/Meta-Llama-3-8B-Instruct"

# API token read from the environment; None when HF_API_KEY is not set.
HF_TOKEN = os.getenv("HF_API_KEY")

# Send the Authorization header only when a token is configured. Formatting a
# missing token would otherwise produce the bogus credential "Bearer None".
headers = {"Authorization": f"Bearer {HF_TOKEN}"} if HF_TOKEN else {}
|
|
|
|
|
@app.get("/")
async def root():
    """Return a fixed status message showing that the service is up."""
    # U+2705 (white heavy check mark) is written as an escape so the literal
    # stays on a single line and survives re-encoding of this file.
    return {"message": "\u2705 QuickPrep is running!"}
|
|
|
|
|
# (connect, read) timeouts in seconds for the upstream call, so that a stalled
# connection cannot hold a request open indefinitely.
_UPSTREAM_TIMEOUT = (5, 120)


@app.post("/generate")
async def generate(request: Request):
    """Forward the request's ``prompt`` to the model endpoint at ``API_URL``.

    The request body must be a JSON object with a non-empty ``"prompt"``
    value. The prompt is posted upstream as ``{"inputs": prompt}`` and the
    upstream JSON payload is returned unchanged.

    Raises:
        HTTPException: 400 if the body is not a JSON object or ``prompt`` is
            missing or empty; 504 if the upstream call times out; 502 if the
            upstream call fails or its response body is not JSON.
    """
    try:
        data = await request.json()
    except ValueError as exc:
        # JSON decoding errors (and undecodable bytes) are ValueError subclasses.
        raise HTTPException(
            status_code=400, detail="Request body must be valid JSON."
        ) from exc

    prompt = data.get("prompt") if isinstance(data, dict) else None
    if not prompt:
        raise HTTPException(
            status_code=400,
            detail='Request body must be a JSON object with a non-empty "prompt".',
        )

    try:
        # requests is synchronous; run it in a worker thread so the event
        # loop keeps serving other requests while the model responds.
        upstream = await run_in_threadpool(
            requests.post,
            API_URL,
            headers=headers,
            json={"inputs": prompt},
            timeout=_UPSTREAM_TIMEOUT,
        )
    except requests.exceptions.Timeout as exc:
        raise HTTPException(
            status_code=504, detail="Upstream model request timed out."
        ) from exc
    except requests.exceptions.RequestException as exc:
        raise HTTPException(
            status_code=502, detail="Upstream model request failed."
        ) from exc

    try:
        # The upstream payload is passed through as-is, including any error
        # object the upstream service returns.
        return upstream.json()
    except ValueError as exc:
        raise HTTPException(
            status_code=502, detail="Upstream response was not valid JSON."
        ) from exc
|
|