gouravbhadraDev committed on
Commit
c7851f3
·
verified ·
1 Parent(s): e6978bd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -7,6 +7,7 @@ app = FastAPI()
7
  qwen3_gguf_llm = Llama.from_pretrained(
8
  repo_id="unsloth/Qwen3-0.6B-GGUF",
9
  filename="Qwen3-0.6B-UD-Q8_K_XL.gguf",
 
10
  )
11
 
12
  class PromptRequest(BaseModel):
 
7
  qwen3_gguf_llm = Llama.from_pretrained(
8
  repo_id="unsloth/Qwen3-0.6B-GGUF",
9
  filename="Qwen3-0.6B-UD-Q8_K_XL.gguf",
10
+ n_threads=-1
11
  )
12
 
13
  class PromptRequest(BaseModel):