ggml-mllm / config.json
matthoffner's picture
Update config.json
e453fb6 verified
raw
history blame
361 Bytes
{
  "host": "0.0.0.0",
  "port": 8080,
  "models": [
    {
      "model": "llava-v1.6-mistral-7b.Q3_K_XS.gguf",
      "model_alias": "llava-1.6",
      "chat_format": "llava-1-5",
      "clip_model_path": "mmproj-model-f16.gguf",
      "n_gpu_layers": -1,
      "offload_kqv": false,
      "n_threads": 12,
      "n_batch": 512,
      "n_ctx": 4096
    }
  ]
}