ftanguy committed on
Commit
f6eda05
·
verified ·
1 Parent(s): b217346

Upload Qwen3ForCausalLM

Browse files
Files changed (2) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
config.json CHANGED
@@ -52,7 +52,7 @@
52
  "_load_in_8bit": false,
53
  "bnb_4bit_compute_dtype": "bfloat16",
54
  "bnb_4bit_quant_storage": "uint8",
55
- "bnb_4bit_quant_type": "fp4",
56
  "bnb_4bit_use_double_quant": true,
57
  "llm_int8_enable_fp32_cpu_offload": false,
58
  "llm_int8_has_fp16_weight": false,
 
52
  "_load_in_8bit": false,
53
  "bnb_4bit_compute_dtype": "bfloat16",
54
  "bnb_4bit_quant_storage": "uint8",
55
+ "bnb_4bit_quant_type": "nf4",
56
  "bnb_4bit_use_double_quant": true,
57
  "llm_int8_enable_fp32_cpu_offload": false,
58
  "llm_int8_has_fp16_weight": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26fa213dbe8c09e525309ed9a346e28b1b6a2a9c89e82d7a6b199a2fed85ca57
3
  size 538883409
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffe7b33f8c2434319b80eeae4adeea92b686976fd876f3bb593ed6c14688d621
3
  size 538883409