Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -7,6 +7,7 @@ app = FastAPI()
|
|
7 |
qwen3_gguf_llm = Llama.from_pretrained(
|
8 |
repo_id="unsloth/Qwen3-0.6B-GGUF",
|
9 |
filename="Qwen3-0.6B-UD-Q8_K_XL.gguf",
|
|
|
10 |
)
|
11 |
|
12 |
class PromptRequest(BaseModel):
|
|
|
7 |
qwen3_gguf_llm = Llama.from_pretrained(
|
8 |
repo_id="unsloth/Qwen3-0.6B-GGUF",
|
9 |
filename="Qwen3-0.6B-UD-Q8_K_XL.gguf",
|
10 |
+
n_threads=-1
|
11 |
)
|
12 |
|
13 |
class PromptRequest(BaseModel):
|