gouravbhadraDev committed on
Commit
ddad736
·
verified ·
1 Parent(s): 80c3a84

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -19,6 +19,6 @@ class GenerateResponse(BaseModel):
19
  @app.post("/generate/qwen3-0.6b-gguf", response_model=GenerateResponse)
20
  async def generate_qwen3_gguf_endpoint(request: PromptRequest):
21
  messages = [{"role": "user", "content": request.prompt}]
22
- response = qwen3_gguf_llm.create_chat_completion(messages=messages, max_tokens=256)
23
  generated_text = response['choices'][0]['message']['content']
24
  return GenerateResponse(generated_text=generated_text)
 
19
  @app.post("/generate/qwen3-0.6b-gguf", response_model=GenerateResponse)
20
  async def generate_qwen3_gguf_endpoint(request: PromptRequest):
21
  messages = [{"role": "user", "content": request.prompt}]
22
+ response = qwen3_gguf_llm.create_chat_completion(messages=messages)
23
  generated_text = response['choices'][0]['message']['content']
24
  return GenerateResponse(generated_text=generated_text)