Oleg Shulyakov committed on
Commit
fca7ea4
·
1 Parent(s): c1ffdc3

Add F16 and BF16 quantization

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -332,7 +332,7 @@ model_id = HuggingfaceHubSearch(
332
  )
333
 
334
  q_method = gr.Dropdown(
335
- ["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0"],
336
  label="Quantization Method",
337
  info="GGML quantization type",
338
  value="Q4_K_M",
 
332
  )
333
 
334
  q_method = gr.Dropdown(
335
+ ["Q2_K", "Q3_K_S", "Q3_K_M", "Q3_K_L", "Q4_0", "Q4_K_S", "Q4_K_M", "Q5_0", "Q5_K_S", "Q5_K_M", "Q6_K", "Q8_0", "F16", "BF16"],
336
  label="Quantization Method",
337
  info="GGML quantization type",
338
  value="Q4_K_M",