Spaces:
Paused
Paused
File size: 1,688 Bytes
ad94d02 f811c72 a4714da ab4421a 6458940 e4f3642 1105ae7 6458940 1cc945a e4f3642 97aa62e e4f3642 10df7bc e4f3642 ad94d02 abb092c 10df7bc e4f3642 3c4eebd 4536ba1 10df7bc 675256a 10df7bc 675256a ad94d02 1643d4d abb092c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 |
FROM python:3.12
#RUN pip install --no-cache-dir torch==2.2.2
#RUN pip install --no-cache-dir flash-attn
RUN apt-get update && \
apt-get install -y \
bash \
git git-lfs \
wget curl procps gnupg \
build-essential cmake \
htop vim nano && \
rm -rf /var/lib/apt/lists/*
# NVIDIA CUDA Keyring installieren (offizielle Methode seit 2024)
RUN wget https://developer.download.nvidia.com/compute/cuda/repos/debian12/x86_64/cuda-keyring_1.1-1_all.deb && \
dpkg -i cuda-keyring_1.1-1_all.deb && \
apt-get update && \
apt-get -y install cuda
# CUDA ENV-Variablen setzen
ENV PATH=/usr/local/cuda/bin:${PATH}
ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:${LD_LIBRARY_PATH}
ENV CUDAToolkit_ROOT=/usr/local/cuda
ENV CMAKE_ARGS="-DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=86"
RUN useradd -m -u 1000 user
USER user
ENV PATH="/home/user/.local/bin:$PATH"
# ^ when run as `user`, pip installs executables there
WORKDIR /app
COPY --chown=user . /app
# Wichtig: Isolation deaktivieren für llama-cpp-python Build
RUN pip install --upgrade pip
# Manuell Build-Werkzeuge bereitstellen
RUN pip install --no-cache-dir \
setuptools \
wheel \
scikit-build-core[pyproject]
# Optional: zuerst llama-cpp-python bauen (cachebar)
RUN pip install --no-cache-dir --no-build-isolation llama-cpp-python
# Danach: outetts (zieht llama-cpp-python nicht erneut)
RUN pip install --no-cache-dir --no-build-isolation outetts
RUN pip install --no-cache-dir -r requirements.txt
#CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860", , "--ws", "auto", "--allow-websocket-origin", "*"]
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"] |