BaoKhuong commited on
Commit
b92ef69
·
verified ·
1 Parent(s): 6a696b5

Update model.py

Browse files
Files changed (1) hide show
  1. model.py +1 -1
model.py CHANGED
@@ -104,7 +104,7 @@ def get_finance_llama_pipeline():
104
 
105
  # Configure llama.cpp loader
106
  threads = int(os.getenv("LLAMA_THREADS", str(os.cpu_count() or 2)))
107
- ctx = int(os.getenv("LLAMA_CTX", "4096")) #Mặc định 2048 -> 1024
108
  batch = int(os.getenv("LLAMA_BATCH", "64")) #Mặc định 128 -> 64
109
  use_mmap = os.getenv("LLAMA_MMAP", "1") in {"1","true","True","yes"}
110
  use_mlock = os.getenv("LLAMA_MLOCK", "0") in {"1","true","True","yes"}
 
104
 
105
  # Configure llama.cpp loader
106
  threads = int(os.getenv("LLAMA_THREADS", str(os.cpu_count() or 2)))
107
+ ctx = int(os.getenv("LLAMA_CTX", "131072")) # Default context raised 4096 -> 131072
108
  batch = int(os.getenv("LLAMA_BATCH", "64")) #Mặc định 128 -> 64
109
  use_mmap = os.getenv("LLAMA_MMAP", "1") in {"1","true","True","yes"}
110
  use_mlock = os.getenv("LLAMA_MLOCK", "0") in {"1","true","True","yes"}