thecollabagepatch committed on
Commit
718a38c
·
1 Parent(s): 6d4a711

jax fixes

Browse files
Files changed (1) hide show
  1. Dockerfile +5 -2
Dockerfile CHANGED
@@ -30,10 +30,10 @@ RUN set -eux; \
30
  ENV LD_PRELOAD=/usr/local/cuda/lib64/libcusparse.so.12:/usr/local/cuda/lib64/libcublas.so.12:/usr/local/cuda/lib64/libcublasLt.so.12:/usr/local/cuda/lib64/libcufft.so.11:/usr/local/cuda/lib64/libcusolver.so.11
31
 
32
  # Better allocator (less fragmentation than BFC during XLA autotune)
33
- # ENV TF_GPU_ALLOCATOR=cuda_malloc_async
34
 
35
  # Let cuBLAS use TF32 fast path on Ada (L40S) for big GEMMs
36
- # ENV TF_ENABLE_CUBLAS_TF32=1 NVIDIA_TF32_OVERRIDE=1
37
 
38
  ENV DEBIAN_FRONTEND=noninteractive \
39
  PYTHONUNBUFFERED=1 \
@@ -128,6 +128,9 @@ RUN python -m pip install --no-cache-dir --force-reinstall "protobuf==4.25.3"
128
 
129
  RUN python -m pip install gradio
130
 
 
 
 
131
  # Switch to Spaces’ preferred user
132
  # Switch to Spaces’ preferred user
133
  RUN useradd -m -u 1000 appuser
 
30
  ENV LD_PRELOAD=/usr/local/cuda/lib64/libcusparse.so.12:/usr/local/cuda/lib64/libcublas.so.12:/usr/local/cuda/lib64/libcublasLt.so.12:/usr/local/cuda/lib64/libcufft.so.11:/usr/local/cuda/lib64/libcusolver.so.11
31
 
32
  # Better allocator (less fragmentation than BFC during XLA autotune)
33
+ ENV TF_GPU_ALLOCATOR=cuda_malloc_async
34
 
35
  # Let cuBLAS use TF32 fast path on Ada (L40S) for big GEMMs
36
+ ENV TF_ENABLE_CUBLAS_TF32=1 NVIDIA_TF32_OVERRIDE=1
37
 
38
  ENV DEBIAN_FRONTEND=noninteractive \
39
  PYTHONUNBUFFERED=1 \
 
128
 
129
  RUN python -m pip install gradio
130
 
131
+ RUN python -m pip install --no-cache-dir --force-reinstall \
132
+ "jax==0.7.1" "jaxlib==0.7.1" "jax[cuda12]==0.7.1"
133
+
134
  # Switch to Spaces’ preferred user
135
  # Switch to Spaces’ preferred user
136
  RUN useradd -m -u 1000 appuser