Spaces:
Paused
Paused
fix(using sail/Sailor2-3B-Chat): sail/Sailor2-3B-Chat
Browse files- Dockerfile +0 -2
- runner.sh +3 -11
Dockerfile
CHANGED
|
@@ -38,7 +38,5 @@ EXPOSE 7860
|
|
| 38 |
#CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]
|
| 39 |
|
| 40 |
RUN chmod +x /app/runner.sh
|
| 41 |
-
RUN chmod +x /app/run-llama.sh
|
| 42 |
-
RUN chmod +x /app/run-sailor.sh
|
| 43 |
|
| 44 |
CMD ["/app/runner.sh"]
|
|
|
|
| 38 |
#CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]
|
| 39 |
|
| 40 |
RUN chmod +x /app/runner.sh
|
|
|
|
|
|
|
| 41 |
|
| 42 |
CMD ["/app/runner.sh"]
|
runner.sh
CHANGED
|
@@ -13,16 +13,8 @@ case "$MODEL_ID" in
|
|
| 13 |
MODEL_REV="0cb88a4f764b7a12671c53f0838cd831a0843b95"
|
| 14 |
;;
|
| 15 |
2)
|
| 16 |
-
MODEL_NAME="sail/
|
| 17 |
-
MODEL_REV="
|
| 18 |
-
;;
|
| 19 |
-
3)
|
| 20 |
-
MODEL_NAME="DeepSeek-R1-Distill-Qwen-32B"
|
| 21 |
-
MODEL_REV="d66bcfc2f3fd52799f95943264f32ba15ca0003d"
|
| 22 |
-
;;
|
| 23 |
-
4)
|
| 24 |
-
MODEL_NAME="deepseek-ai/DeepSeek-V3"
|
| 25 |
-
MODEL_REV="1d044fd82b15f1cedb197a288e50cc96a2c27205"
|
| 26 |
;;
|
| 27 |
*)
|
| 28 |
echo "Error: Invalid MODEL_ID. Valid values are 1 or 2."
|
|
@@ -67,7 +59,7 @@ python -u /app/openai_compatible_api_server.py \
|
|
| 67 |
--port 7860 \
|
| 68 |
--max-num-batched-tokens 32768 \
|
| 69 |
--max-model-len 32768 \
|
| 70 |
-
--dtype
|
| 71 |
--enforce-eager \
|
| 72 |
--gpu-memory-utilization 0.9 \
|
| 73 |
--enable-prefix-caching \
|
|
|
|
| 13 |
MODEL_REV="0cb88a4f764b7a12671c53f0838cd831a0843b95"
|
| 14 |
;;
|
| 15 |
2)
|
| 16 |
+
MODEL_NAME="sail/Sailor2-3B-Chat"
|
| 17 |
+
MODEL_REV="d60722644e700133576489719dcbc288036628d5"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 18 |
;;
|
| 19 |
*)
|
| 20 |
echo "Error: Invalid MODEL_ID. Valid values are 1 or 2."
|
|
|
|
| 59 |
--port 7860 \
|
| 60 |
--max-num-batched-tokens 32768 \
|
| 61 |
--max-model-len 32768 \
|
| 62 |
+
--dtype bfloat16 \
|
| 63 |
--enforce-eager \
|
| 64 |
--gpu-memory-utilization 0.9 \
|
| 65 |
--enable-prefix-caching \
|