# Seven space-separated key="value" assignments on a single line. Every value,
# including the boolean-looking ("True") and integer-looking ("6", "1024",
# "40") ones, is written as a double-quoted string, so any type conversion is
# left to whatever reads this file.
#
# model is a relative path (no leading "/"); presumably it is resolved against
# the consumer's working directory -- TODO confirm.
#
# NOTE(review): the key names (model, use_mmap, use_mlock, n_threads, n_ctx,
# n_gpu_layers, docs_url) look like llama.cpp-style model-server settings --
# confirm against the program that loads this file before relying on that.
# NOTE(review): if the consumer is a dotenv-style loader it may expect one
# assignment per line -- verify that this single-line form is parsed as
# intended.
model="wizardLM-7B-GGML/wizardLM-7B.ggmlv3.q4_0.bin" use_mmap="True" use_mlock="True" n_threads="6" n_ctx="1024" n_gpu_layers="40" docs_url="/"