Luigi committed on
Commit
5a94240
·
1 Parent(s): 5fc1115

default f16 precision

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -21,15 +21,15 @@ MODELS = {
21
  "clip_repo": "ggml-org/SmolVLM2-256M-Video-Instruct-GGUF",
22
  "model_prefix": "SmolVLM2-256M-Video-Instruct",
23
  "clip_prefix": "mmproj-SmolVLM2-256M-Video-Instruct",
24
- "model_variants": ["Q4_K_M", "f16", "Q8_0", "Q2_K", ],
25
- "clip_variants": ["f16", "Q8_0", ],
26
  },
27
  "500M": {
28
  "model_repo": "mradermacher/SmolVLM2-500M-Video-Instruct-GGUF",
29
  "clip_repo": "ggml-org/SmolVLM2-500M-Video-Instruct-GGUF",
30
  "model_prefix": "SmolVLM2-500M-Video-Instruct",
31
  "clip_prefix": "mmproj-SmolVLM2-500M-Video-Instruct",
32
- "model_variants": ["Q4_K_M", "Q8_0", "Q2_K", "f16"],
33
  "clip_variants": ["Q8_0", "f16"],
34
  },
35
  "2.2B": {
@@ -37,7 +37,7 @@ MODELS = {
37
  "clip_repo": "ggml-org/SmolVLM2-2.2B-Instruct-GGUF",
38
  "model_prefix": "SmolVLM2-2.2B-Instruct",
39
  "clip_prefix": "mmproj-SmolVLM2-2.2B-Instruct",
40
- "model_variants": ["Q4_K_M", "Q8_0", "Q2_K", "f16"],
41
  "clip_variants": ["Q8_0", "f16"],
42
  },
43
  }
 
21
  "clip_repo": "ggml-org/SmolVLM2-256M-Video-Instruct-GGUF",
22
  "model_prefix": "SmolVLM2-256M-Video-Instruct",
23
  "clip_prefix": "mmproj-SmolVLM2-256M-Video-Instruct",
24
+ "model_variants": ["f16", "Q8_0", "Q2_K", "Q4_K_M"],
25
+ "clip_variants": ["Q8_0", "f16"],
26
  },
27
  "500M": {
28
  "model_repo": "mradermacher/SmolVLM2-500M-Video-Instruct-GGUF",
29
  "clip_repo": "ggml-org/SmolVLM2-500M-Video-Instruct-GGUF",
30
  "model_prefix": "SmolVLM2-500M-Video-Instruct",
31
  "clip_prefix": "mmproj-SmolVLM2-500M-Video-Instruct",
32
+ "model_variants": ["f16", "Q4_K_M", "Q8_0", "Q2_K"],
33
  "clip_variants": ["Q8_0", "f16"],
34
  },
35
  "2.2B": {
 
37
  "clip_repo": "ggml-org/SmolVLM2-2.2B-Instruct-GGUF",
38
  "model_prefix": "SmolVLM2-2.2B-Instruct",
39
  "clip_prefix": "mmproj-SmolVLM2-2.2B-Instruct",
40
+ "model_variants": ["f16", "Q4_K_M", "Q8_0", "Q2_K"],
41
  "clip_variants": ["Q8_0", "f16"],
42
  },
43
  }