Spaces:

yusufs
/

llama32-3b-instruct

Running on T4

yusufs committed on 17 days ago

Commit

344825e

verified ·

1 Parent(s): 3044680

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,5 +1,7 @@
 FROM nvidia/cuda:11.7.1-cudnn8-runtime-ubuntu22.04
 RUN apt-get update && apt-get install -y python3 python3-pip git
 RUN pip3 install --upgrade pip
@@ -22,8 +24,7 @@ RUN pip3 install vllm==0.10.0 --extra-index-url https://download.pytorch.org/whl
 EXPOSE 7860
-CMD export VLLM_LOGGING_LEVEL=DEBUG && \
-  python3 -m vllm.entrypoints.openai.api_server \
   --model "meta-llama/Llama-3.2-3B-Instruct" \
   --task generate \
   --revision "0cb88a4f764b7a12671c53f0838cd831a0843b95" \

 FROM nvidia/cuda:11.7.1-cudnn8-runtime-ubuntu22.04
+ENV VLLM_LOGGING_LEVEL=DEBUG
 RUN apt-get update && apt-get install -y python3 python3-pip git
 RUN pip3 install --upgrade pip
 EXPOSE 7860
+CMD python3 -m vllm.entrypoints.openai.api_server \
   --model "meta-llama/Llama-3.2-3B-Instruct" \
   --task generate \
   --revision "0cb88a4f764b7a12671c53f0838cd831a0843b95" \