Spaces:
Running
Running
add "Q4_K_M" precision
Browse files
app.py
CHANGED
@@ -21,7 +21,7 @@ MODELS = {
|
|
21 |
"clip_repo": "ggml-org/SmolVLM2-256M-Video-Instruct-GGUF",
|
22 |
"model_prefix": "SmolVLM2-256M-Video-Instruct",
|
23 |
"clip_prefix": "mmproj-SmolVLM2-256M-Video-Instruct",
|
24 |
-
"model_variants": ["f16", "Q8_0", "Q2_K", ],
|
25 |
"clip_variants": ["f16", "Q8_0", ],
|
26 |
},
|
27 |
"500M": {
|
@@ -29,7 +29,7 @@ MODELS = {
|
|
29 |
"clip_repo": "ggml-org/SmolVLM2-500M-Video-Instruct-GGUF",
|
30 |
"model_prefix": "SmolVLM2-500M-Video-Instruct",
|
31 |
"clip_prefix": "mmproj-SmolVLM2-500M-Video-Instruct",
|
32 |
-
"model_variants": ["Q8_0", "Q2_K", "f16"],
|
33 |
"clip_variants": ["Q8_0", "f16"],
|
34 |
},
|
35 |
"2.2B": {
|
@@ -37,7 +37,7 @@ MODELS = {
|
|
37 |
"clip_repo": "ggml-org/SmolVLM2-2.2B-Instruct-GGUF",
|
38 |
"model_prefix": "SmolVLM2-2.2B-Instruct",
|
39 |
"clip_prefix": "mmproj-SmolVLM2-2.2B-Instruct",
|
40 |
-
"model_variants": ["Q8_0", "Q2_K","Q4_K_M", "f16"],
|
41 |
"clip_variants": ["Q8_0", "f16"],
|
42 |
},
|
43 |
}
|
|
|
21 |
"clip_repo": "ggml-org/SmolVLM2-256M-Video-Instruct-GGUF",
|
22 |
"model_prefix": "SmolVLM2-256M-Video-Instruct",
|
23 |
"clip_prefix": "mmproj-SmolVLM2-256M-Video-Instruct",
|
24 |
+
"model_variants": ["Q4_K_M", "f16", "Q8_0", "Q2_K", ],
|
25 |
"clip_variants": ["f16", "Q8_0", ],
|
26 |
},
|
27 |
"500M": {
|
|
|
29 |
"clip_repo": "ggml-org/SmolVLM2-500M-Video-Instruct-GGUF",
|
30 |
"model_prefix": "SmolVLM2-500M-Video-Instruct",
|
31 |
"clip_prefix": "mmproj-SmolVLM2-500M-Video-Instruct",
|
32 |
+
"model_variants": ["Q4_K_M", "Q8_0", "Q2_K", "f16"],
|
33 |
"clip_variants": ["Q8_0", "f16"],
|
34 |
},
|
35 |
"2.2B": {
|
|
|
37 |
"clip_repo": "ggml-org/SmolVLM2-2.2B-Instruct-GGUF",
|
38 |
"model_prefix": "SmolVLM2-2.2B-Instruct",
|
39 |
"clip_prefix": "mmproj-SmolVLM2-2.2B-Instruct",
|
40 |
+
"model_variants": ["Q4_K_M", "Q8_0", "Q2_K", "f16"],
|
41 |
"clip_variants": ["Q8_0", "f16"],
|
42 |
},
|
43 |
}
|