Spaces:
Paused
Paused
Update Dockerfile
Browse files- Dockerfile +11 -0
Dockerfile
CHANGED
@@ -22,6 +22,10 @@ ENV VLLM_USE_TRITON_FLASH_ATTN=0
|
|
22 |
# Choose XFORMERS, the most stable attention backend for T4
|
23 |
ENV VLLM_ATTENTION_BACKEND=XFORMERS
|
24 |
|
|
|
|
|
|
|
|
|
25 |
# Set environment variables to avoid interactive prompts
|
26 |
ENV DEBIAN_FRONTEND=noninteractive
|
27 |
|
@@ -51,6 +55,13 @@ RUN python3 --version && python3 -m pip --version
|
|
51 |
# RUN apt-get update && apt-get install -y python3 python3-pip git
|
52 |
# RUN pip install --upgrade pip
|
53 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
54 |
# Install vLLM
|
55 |
RUN pip install vllm==0.10.0 --extra-index-url https://download.pytorch.org/whl/cu113
|
56 |
|
|
|
22 |
# Choose XFORMERS, the most stable attention backend for T4
|
23 |
ENV VLLM_ATTENTION_BACKEND=XFORMERS
|
24 |
|
25 |
+
# Set environment variables for the xformers build
|
26 |
+
ENV TORCH_CUDA_ARCH_LIST='7.0 7.5 8.0 8.9 9.0 10.0+PTX'
|
27 |
+
ENV MAX_JOBS=16
|
28 |
+
|
29 |
# Set environment variables to avoid interactive prompts
|
30 |
ENV DEBIAN_FRONTEND=noninteractive
|
31 |
|
|
|
55 |
# RUN apt-get update && apt-get install -y python3 python3-pip git
|
56 |
# RUN pip install --upgrade pip
|
57 |
|
58 |
+
# Install uv using pip
|
59 |
+
RUN pip install uv
|
60 |
+
|
61 |
+
# Install xformers using uv
|
62 |
+
RUN uv pip install --system \
|
63 |
+
--no-build-isolation "git+https://github.com/facebookresearch/xformers@v0.0.31"
|
64 |
+
|
65 |
# Install vLLM
|
66 |
RUN pip install vllm==0.10.0 --extra-index-url https://download.pytorch.org/whl/cu113
|
67 |
|