dev-mode-orpheus

Paused

Tomtom84 commited on Apr 20

Commit

49ee602

verified ·

1 Parent(s): efa5012

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,9 +1,13 @@
-# GPU‑fertige Basis mit Python 3.10, CUDA 11.8, cuDNN 8
-FROM pytorch/pytorch:2.2.2-cuda11.8-cudnn8-runtime
 # System‑Tools (schlank halten!)
 RUN apt-get update && \
-    apt-get install -y git-lfs build-essential && \
     rm -rf /var/lib/apt/lists/*
 # Non‑root‑User, weil Spaces das mögen
@@ -20,7 +24,8 @@ RUN pip install --upgrade pip && \
 # Optional: flash‑attn (Ampere 86 wird erkannt, Wheel vorhanden)
 # fertiges Wheel laden (kein nvcc)
-RUN pip install --no-cache-dir "flash-attn>=2.6.3,<=2.7" --extra-index-url https://download.pytorch.org/whl/cu118
 # Mount das geheime HF‑Token beim Build:
 #   Settings → Secrets → Name: HF_TOKEN  (scope: "read")

+# GPU-ready base with Python 3.10, CUDA 12.1, cuDNN 8 (runtime variant, 3.4 GB).
+# Keep comments on their own line: Docker parses a trailing "# ..." as extra FROM arguments.
+FROM pytorch/pytorch:2.2.2-cuda12.1-cudnn8-runtime
 # System tools (keep it lean!)
 # Refreshes the apt index, installs the tools, and removes the index files
 # again within the same RUN so they do not persist in the resulting layer.
 RUN apt-get update && \
+    apt-get install -y git-lfs build-essential bash \
+      git \
+      wget curl procps gnupg \
+      cmake \
+      htop vim nano && \
     rm -rf /var/lib/apt/lists/*
 # Non-root user, because Spaces prefer it
 # Optional: flash-attn (Ampere 86 is detected, wheel available)
 # Download the prebuilt wheel (no nvcc)
 # NOTE(review): the wheel filename is tagged cu12 / torch2.2 / cp310 / cxx11abiFALSE;
 # presumably this matches the base image's CUDA, PyTorch and Python builds — confirm
 # whenever the base image tag changes.
+RUN pip install --no-cache-dir \
+    https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.2cxx11abiFALSE-cp310-cp310-linux_x86_64.whl
 # Mount das geheime HF‑Token beim Build:
 #   Settings → Secrets → Name: HF_TOKEN  (scope: "read")