Spaces:
Sleeping
Sleeping
Oleg Shulyakov
committed on
Commit
·
fca7ea4
1
Parent(s):
c1ffdc3
Add F16 and BF16 quantization
Browse files
app.py
CHANGED
@@ -332,7 +332,7 @@ model_id = HuggingfaceHubSearch(
|
|
332 |
)
|
333 |
|
334 |
q_method = gr.Dropdown(
|
335 |
-
["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0"],
|
336 |
label="Quantization Method",
|
337 |
info="GGML quantization type",
|
338 |
value="Q4_K_M",
|
|
|
332 |
)
|
333 |
|
334 |
q_method = gr.Dropdown(
|
335 |
+
["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0", "F16", "BF16"],
|
336 |
label="Quantization Method",
|
337 |
info="GGML quantization type",
|
338 |
value="Q4_K_M",
|