johnbridges committed on
Commit
6e03628
·
1 Parent(s): 5a4dfcf

Trying bf16 phi 4 mini

Browse files
Files changed (2) hide show
  1. Dockerfile +3 -3
  2. appsettings.json +1 -1
Dockerfile CHANGED
@@ -30,13 +30,13 @@ WORKDIR /home/user
30
  RUN mkdir -p /home/user/code/models && \
31
  mkdir -p /home/user/code/app/wwwroot && \
32
  cd /home/user/code/models && \
33
- wget -q https://huggingface.co/Mungert/Phi-4-mini-instruct.gguf/resolve/main/phi-4-mini-q4_0.gguf
34
 
35
 
36
  # Clone and build OpenBLAS as the non-root user
37
  RUN git clone https://github.com/OpenMathLib/OpenBLAS.git /home/user/code/models/OpenBLAS && \
38
  cd /home/user/code/models/OpenBLAS && \
39
- make -j$(nproc) > build.log 2>&1 || (tail -20 build.log && false)
40
 
41
  # Switch to root for the OpenBLAS installation
42
  USER root
@@ -52,7 +52,7 @@ RUN git clone https://github.com/ggerganov/llama.cpp /home/user/code/models/llam
52
  cd /home/user/code/models/llama.cpp && \
53
  export PKG_CONFIG_PATH=/opt/OpenBLAS/lib/pkgconfig:$PKG_CONFIG_PATHa && \
54
  cmake -B build -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DBLAS_INCLUDE_DIRS=/home/user/code/models/OpenBLAS -DLLAMA_CURL=OFF && \
55
- cmake --build build --config Release -j$(nproc) && \
56
  cp /home/user/code/models/llama.cpp/build/bin/* /home/user/code/models/llama.cpp/
57
 
58
 
 
30
  RUN mkdir -p /home/user/code/models && \
31
  mkdir -p /home/user/code/app/wwwroot && \
32
  cd /home/user/code/models && \
33
+ wget -q https://huggingface.co/Mungert/Phi-4-mini-instruct.gguf/resolve/main/phi-4-mini-bf16.gguf
34
 
35
 
36
  # Clone and build OpenBLAS as the non-root user
37
  RUN git clone https://github.com/OpenMathLib/OpenBLAS.git /home/user/code/models/OpenBLAS && \
38
  cd /home/user/code/models/OpenBLAS && \
39
+ make -j2 > build.log 2>&1 || (tail -20 build.log && false)
40
 
41
  # Switch to root for the OpenBLAS installation
42
  USER root
 
52
  cd /home/user/code/models/llama.cpp && \
53
  export PKG_CONFIG_PATH=/opt/OpenBLAS/lib/pkgconfig:$PKG_CONFIG_PATHa && \
54
  cmake -B build -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DBLAS_INCLUDE_DIRS=/home/user/code/models/OpenBLAS -DLLAMA_CURL=OFF && \
55
+ cmake --build build --config Release -j2 && \
56
  cp /home/user/code/models/llama.cpp/build/bin/* /home/user/code/models/llama.cpp/
57
 
58
 
appsettings.json CHANGED
@@ -23,7 +23,7 @@
23
  "LlmNoInitMessage" : false,
24
  "ServiceAuthKey" : ".env" ,
25
  "LlmModelPath" : "/home/user/code/models/",
26
- "LlmModelFileName" : "phi-4-mini-q4_0.gguf",
27
  "LlmContextFileName" : "context-phi-4-mini.gguf",
28
  "LlmSystemPrompt" : "system_prompt_phi_4_mini_run",
29
  "LlmPromptMode" : " -if -sp -no-cnv --simple-io ",
 
23
  "LlmNoInitMessage" : false,
24
  "ServiceAuthKey" : ".env" ,
25
  "LlmModelPath" : "/home/user/code/models/",
26
+ "LlmModelFileName" : "phi-4-mini-bf16.gguf",
27
  "LlmContextFileName" : "context-phi-4-mini.gguf",
28
  "LlmSystemPrompt" : "system_prompt_phi_4_mini_run",
29
  "LlmPromptMode" : " -if -sp -no-cnv --simple-io ",