Commit
·
718a38c
1
Parent(s):
6d4a711
JAX fixes
Browse files - Dockerfile +5 -2
Dockerfile
CHANGED
@@ -30,10 +30,10 @@ RUN set -eux; \
|
|
30 |
ENV LD_PRELOAD=/usr/local/cuda/lib64/libcusparse.so.12:/usr/local/cuda/lib64/libcublas.so.12:/usr/local/cuda/lib64/libcublasLt.so.12:/usr/local/cuda/lib64/libcufft.so.11:/usr/local/cuda/lib64/libcusolver.so.11
|
31 |
|
32 |
# Better allocator (less fragmentation than BFC during XLA autotune)
|
33 |
-
|
34 |
|
35 |
# Let cuBLAS use TF32 fast path on Ada (L40S) for big GEMMs
|
36 |
-
|
37 |
|
38 |
ENV DEBIAN_FRONTEND=noninteractive \
|
39 |
PYTHONUNBUFFERED=1 \
|
@@ -128,6 +128,9 @@ RUN python -m pip install --no-cache-dir --force-reinstall "protobuf==4.25.3"
|
|
128 |
|
129 |
RUN python -m pip install gradio
|
130 |
|
|
|
|
|
|
|
131 |
# Switch to Spaces’ preferred user
|
132 |
# Switch to Spaces’ preferred user
|
133 |
RUN useradd -m -u 1000 appuser
|
|
|
30 |
ENV LD_PRELOAD=/usr/local/cuda/lib64/libcusparse.so.12:/usr/local/cuda/lib64/libcublas.so.12:/usr/local/cuda/lib64/libcublasLt.so.12:/usr/local/cuda/lib64/libcufft.so.11:/usr/local/cuda/lib64/libcusolver.so.11
|
31 |
|
32 |
# Better allocator (less fragmentation than BFC during XLA autotune)
|
33 |
+
ENV TF_GPU_ALLOCATOR=cuda_malloc_async
|
34 |
|
35 |
# Let cuBLAS use TF32 fast path on Ada (L40S) for big GEMMs
|
36 |
+
ENV TF_ENABLE_CUBLAS_TF32=1 NVIDIA_TF32_OVERRIDE=1
|
37 |
|
38 |
ENV DEBIAN_FRONTEND=noninteractive \
|
39 |
PYTHONUNBUFFERED=1 \
|
|
|
128 |
|
129 |
RUN python -m pip install gradio
|
130 |
|
131 |
+
RUN python -m pip install --no-cache-dir --force-reinstall \
|
132 |
+
"jax==0.7.1" "jaxlib==0.7.1" "jax[cuda12]==0.7.1"
|
133 |
+
|
134 |
# Switch to Spaces’ preferred user
|
135 |
# Switch to Spaces’ preferred user
|
136 |
RUN useradd -m -u 1000 appuser
|