File size: 838 Bytes
d75b820 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 |
from typing import Optional
from pydantic import BaseModel, Field
from fastapi import FastAPI, HTTPException
from contextlib import asynccontextmanager
from starlette.responses import FileResponse
class ConvertRequest(BaseModel):
hf_model_name: str
hf_token: Optional[str] = Field(None, description="Hugging Face token for private models")
@asynccontextmanager
async def lifespan(app:FastAPI):
yield
app = FastAPI(title="Huggingface Safetensor Model Converter to AWQ", version="0.1.0", lifespan=lifespan)
@app.get("/health")
def read_root():
return {"status": "ok"}
@app.post("/convert")
def convert(request: ConvertRequest)->FileResponse:
raise HTTPException(status_code=501, detail="Not Implemented yet")
#return FileResponse(file_location, media_type='application/octet-stream',filename=file_name) |