{ "SchemaVersion": 1, "GeneratedUtc": "2026-05-12T03:07:11.9732721Z", "Generator": "MagicQuant", "SourceRepository": "magiccodingman/Qwen3.6-35B-A3B-MagicQuant-GGUF", "SourceJson": null, "SourceModelId": "mq-blake3:f5ea826f4ad276ba78a5e0c62417df1e42543230f648c33a50c2fbcc8b81d20c", "SourceArchitectureFamily": "Qwen3.6-35B-A3B", "Notes": "Exact GGUF tensor quantization map for repository clone/reproducibility mode. This file is not a proof that another cloned model went through the full MagicQuant evolution pipeline. External reference finalists use persisted SQLite learned tensor truth when no local final GGUF was exported.", "Artifacts": [ { "FileName": "Qwen3.6-35B-A3B-LM-Q8_0.gguf", "DisplayName": "LM-Q8_0", "ShortName": "LM-Q8_0", "Provider": "llama.cpp", "QuantFamily": "Q8_0", "BaseQuant": "Q8_0", "IsHybrid": false, "UsedImatrix": true, "SourceKld": 0.004654, "SourcePpl": 5.678789, "SourcePplDeltaPercent": -0.14438192368560207, "SourceSizeBytes": 36903139744, "SourceSizeGB": 36.903139744, "SourceSizeGiB": 34.36872711777687, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q8_0", "blk.0.ffn_down_exps.weight": "Q8_0", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "Q8_0", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "Q8_0", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "Q8_0", "blk.0.ssm_beta.weight": "Q8_0", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q8_0", "blk.1.ffn_down_exps.weight": "Q8_0", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "Q8_0", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "Q8_0", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "Q8_0", "blk.1.ssm_beta.weight": "Q8_0", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q8_0", "blk.10.ffn_down_exps.weight": "Q8_0", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "Q8_0", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "Q8_0", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "Q8_0", "blk.10.ssm_beta.weight": "Q8_0", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q8_0", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "Q8_0", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "Q8_0", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "Q8_0", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q8_0", "blk.12.ffn_down_exps.weight": "Q8_0", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "Q8_0", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "Q8_0", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "Q8_0", "blk.12.ssm_beta.weight": "Q8_0", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q8_0", "blk.13.ffn_down_exps.weight": "Q8_0", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "Q8_0", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "Q8_0", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "Q8_0", "blk.13.ssm_beta.weight": "Q8_0", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q8_0", "blk.14.ffn_down_exps.weight": "Q8_0", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "Q8_0", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "Q8_0", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "Q8_0", "blk.14.ssm_beta.weight": "Q8_0", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q8_0", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "Q8_0", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "Q8_0", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "Q8_0", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q8_0", "blk.16.ffn_down_exps.weight": "Q8_0", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "Q8_0", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "Q8_0", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "Q8_0", "blk.16.ssm_beta.weight": "Q8_0", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q8_0", "blk.17.ffn_down_exps.weight": "Q8_0", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "Q8_0", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "Q8_0", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "Q8_0", "blk.17.ssm_beta.weight": "Q8_0", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q8_0", "blk.18.ffn_down_exps.weight": "Q8_0", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "Q8_0", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "Q8_0", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "Q8_0", "blk.18.ssm_beta.weight": "Q8_0", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q8_0", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "Q8_0", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "Q8_0", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "Q8_0", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q8_0", "blk.2.ffn_down_exps.weight": "Q8_0", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "Q8_0", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "Q8_0", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "Q8_0", "blk.2.ssm_beta.weight": "Q8_0", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q8_0", "blk.20.ffn_down_exps.weight": "Q8_0", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "Q8_0", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "Q8_0", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "Q8_0", "blk.20.ssm_beta.weight": "Q8_0", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q8_0", "blk.21.ffn_down_exps.weight": "Q8_0", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "Q8_0", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "Q8_0", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "Q8_0", "blk.21.ssm_beta.weight": "Q8_0", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q8_0", "blk.22.ffn_down_exps.weight": "Q8_0", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "Q8_0", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "Q8_0", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "Q8_0", "blk.22.ssm_beta.weight": "Q8_0", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q8_0", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "Q8_0", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "Q8_0", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "Q8_0", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q8_0", "blk.24.ffn_down_exps.weight": "Q8_0", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "Q8_0", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "Q8_0", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "Q8_0", "blk.24.ssm_beta.weight": "Q8_0", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q8_0", "blk.25.ffn_down_exps.weight": "Q8_0", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "Q8_0", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "Q8_0", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "Q8_0", "blk.25.ssm_beta.weight": "Q8_0", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q8_0", "blk.26.ffn_down_exps.weight": "Q8_0", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "Q8_0", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "Q8_0", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "Q8_0", "blk.26.ssm_beta.weight": "Q8_0", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q8_0", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "Q8_0", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "Q8_0", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "Q8_0", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q8_0", "blk.28.ffn_down_exps.weight": "Q8_0", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "Q8_0", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "Q8_0", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "Q8_0", "blk.28.ssm_beta.weight": "Q8_0", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q8_0", "blk.29.ffn_down_exps.weight": "Q8_0", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "Q8_0", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "Q8_0", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "Q8_0", "blk.29.ssm_beta.weight": "Q8_0", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q8_0", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "Q8_0", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "Q8_0", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "Q8_0", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q8_0", "blk.30.ffn_down_exps.weight": "Q8_0", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "Q8_0", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "Q8_0", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "Q8_0", "blk.30.ssm_beta.weight": "Q8_0", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q8_0", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "Q8_0", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "Q8_0", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "Q8_0", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q8_0", "blk.32.ffn_down_exps.weight": "Q8_0", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "Q8_0", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "Q8_0", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "Q8_0", "blk.32.ssm_beta.weight": "Q8_0", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q8_0", "blk.33.ffn_down_exps.weight": "Q8_0", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "Q8_0", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "Q8_0", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "Q8_0", "blk.33.ssm_beta.weight": "Q8_0", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q8_0", "blk.34.ffn_down_exps.weight": "Q8_0", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "Q8_0", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "Q8_0", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "Q8_0", "blk.34.ssm_beta.weight": "Q8_0", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q8_0", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "Q8_0", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "Q8_0", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "Q8_0", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q8_0", "blk.36.ffn_down_exps.weight": "Q8_0", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "Q8_0", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "Q8_0", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "Q8_0", "blk.36.ssm_beta.weight": "Q8_0", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q8_0", "blk.37.ffn_down_exps.weight": "Q8_0", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "Q8_0", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "Q8_0", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "Q8_0", "blk.37.ssm_beta.weight": "Q8_0", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q8_0", "blk.38.ffn_down_exps.weight": "Q8_0", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "Q8_0", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "Q8_0", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "Q8_0", "blk.38.ssm_beta.weight": "Q8_0", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q8_0", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q8_0", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "Q8_0", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "Q8_0", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q8_0", "blk.4.ffn_down_exps.weight": "Q8_0", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "Q8_0", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "Q8_0", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "Q8_0", "blk.4.ssm_beta.weight": "Q8_0", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q8_0", "blk.5.ffn_down_exps.weight": "Q8_0", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "Q8_0", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "Q8_0", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "Q8_0", "blk.5.ssm_beta.weight": "Q8_0", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q8_0", "blk.6.ffn_down_exps.weight": "Q8_0", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "Q8_0", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "Q8_0", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "Q8_0", "blk.6.ssm_beta.weight": "Q8_0", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q8_0", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "Q8_0", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "Q8_0", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "Q8_0", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q8_0", "blk.8.ffn_down_exps.weight": "Q8_0", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "Q8_0", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "Q8_0", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "Q8_0", "blk.8.ssm_beta.weight": "Q8_0", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q8_0", "blk.9.ffn_down_exps.weight": "Q8_0", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "Q8_0", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "Q8_0", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "Q8_0", "blk.9.ssm_beta.weight": "Q8_0", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q8_0" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-Q6_K_1.gguf", "DisplayName": "MQ-Q6_K_1", "ShortName": "MQ-Q6_K_1", "Provider": "MagicQuant", "QuantFamily": "Q6_K", "BaseQuant": "Q6_K", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.005149, "SourcePpl": 5.673763, "SourcePplDeltaPercent": -0.23275892386144126, "SourceSizeBytes": 31590586784, "SourceSizeGB": 31.590586784000003, "SourceSizeGiB": 29.42102661728859, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q8_0", "blk.0.ffn_down_exps.weight": "Q8_0", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "Q6_K", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "Q6_K", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "F32", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q8_0", "blk.1.ffn_down_exps.weight": "Q8_0", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "Q6_K", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "Q6_K", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "F32", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q8_0", "blk.10.ffn_down_exps.weight": "Q8_0", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "Q6_K", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "Q6_K", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "F32", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q8_0", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "Q8_0", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "Q6_K", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "Q6_K", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q8_0", "blk.12.ffn_down_exps.weight": "Q8_0", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "Q6_K", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "Q6_K", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "F32", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q8_0", "blk.13.ffn_down_exps.weight": "Q8_0", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "Q6_K", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "Q6_K", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "F32", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q8_0", "blk.14.ffn_down_exps.weight": "Q8_0", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "Q6_K", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "Q6_K", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "F32", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q8_0", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "Q8_0", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "Q6_K", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "Q6_K", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q8_0", "blk.16.ffn_down_exps.weight": "Q8_0", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "Q6_K", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "Q6_K", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "F32", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q8_0", "blk.17.ffn_down_exps.weight": "Q8_0", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "Q6_K", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "Q6_K", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "F32", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q8_0", "blk.18.ffn_down_exps.weight": "Q8_0", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "Q6_K", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "Q6_K", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "F32", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q8_0", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "Q8_0", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "Q6_K", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "Q6_K", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q8_0", "blk.2.ffn_down_exps.weight": "Q8_0", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "Q6_K", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "Q6_K", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "F32", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q8_0", "blk.20.ffn_down_exps.weight": "Q8_0", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "Q6_K", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "Q6_K", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "F32", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q8_0", "blk.21.ffn_down_exps.weight": "Q8_0", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "Q6_K", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "Q6_K", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "F32", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q8_0", "blk.22.ffn_down_exps.weight": "Q8_0", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "Q6_K", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "Q6_K", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "F32", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q8_0", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "Q8_0", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "Q6_K", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "Q6_K", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q8_0", "blk.24.ffn_down_exps.weight": "Q8_0", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "Q6_K", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "Q6_K", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "F32", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q8_0", "blk.25.ffn_down_exps.weight": "Q8_0", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "Q6_K", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "Q6_K", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "F32", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q8_0", "blk.26.ffn_down_exps.weight": "Q8_0", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "Q6_K", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "Q6_K", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "F32", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q8_0", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "Q8_0", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "Q6_K", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "Q6_K", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q8_0", "blk.28.ffn_down_exps.weight": "Q8_0", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "Q6_K", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "Q6_K", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "F32", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q8_0", "blk.29.ffn_down_exps.weight": "Q8_0", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "Q6_K", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "Q6_K", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "F32", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q8_0", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "Q8_0", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "Q6_K", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "Q6_K", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q8_0", "blk.30.ffn_down_exps.weight": "Q8_0", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "Q6_K", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "Q6_K", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "F32", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q8_0", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "Q8_0", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "Q6_K", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "Q6_K", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q8_0", "blk.32.ffn_down_exps.weight": "Q8_0", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "Q6_K", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "Q6_K", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "F32", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q8_0", "blk.33.ffn_down_exps.weight": "Q8_0", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "Q6_K", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "Q6_K", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "F32", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q8_0", "blk.34.ffn_down_exps.weight": "Q8_0", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "Q6_K", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "Q6_K", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "F32", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q8_0", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "Q8_0", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "Q6_K", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "Q6_K", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q8_0", "blk.36.ffn_down_exps.weight": "Q8_0", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "Q6_K", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "Q6_K", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "F32", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q8_0", "blk.37.ffn_down_exps.weight": "Q8_0", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "Q6_K", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "Q6_K", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "F32", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q8_0", "blk.38.ffn_down_exps.weight": "Q8_0", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "Q6_K", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "Q6_K", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "F32", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q8_0", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q8_0", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "Q6_K", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "Q6_K", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q8_0", "blk.4.ffn_down_exps.weight": "Q8_0", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "Q6_K", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "Q6_K", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "F32", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q8_0", "blk.5.ffn_down_exps.weight": "Q8_0", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "Q6_K", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "Q6_K", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "F32", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q8_0", "blk.6.ffn_down_exps.weight": "Q8_0", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "Q6_K", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "Q6_K", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "F32", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q8_0", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "Q8_0", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "Q6_K", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "Q6_K", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q8_0", "blk.8.ffn_down_exps.weight": "Q8_0", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "Q6_K", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "Q6_K", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "F32", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q8_0", "blk.9.ffn_down_exps.weight": "Q8_0", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "Q6_K", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "Q6_K", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "F32", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q6_K" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-Q5_K_1.gguf", "DisplayName": "MQ-Q5_K_1", "ShortName": "MQ-Q5_K_1", "Provider": "MagicQuant", "QuantFamily": "Q5_K", "BaseQuant": "Q6_K", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.005523, "SourcePpl": 5.68002, "SourcePplDeltaPercent": -0.12273606470899297, "SourceSizeBytes": 29185153440, "SourceSizeGB": 29.18515344, "SourceSizeGiB": 27.18079224228859, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q8_0", "blk.0.ffn_down_exps.weight": "Q6_K", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "Q6_K", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "Q6_K", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "F32", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q8_0", "blk.1.ffn_down_exps.weight": "Q6_K", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "Q6_K", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "Q6_K", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "F32", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q8_0", "blk.10.ffn_down_exps.weight": "Q6_K", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "Q6_K", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "Q6_K", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "F32", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q8_0", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "Q6_K", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "Q6_K", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "Q6_K", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q8_0", "blk.12.ffn_down_exps.weight": "Q6_K", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "Q6_K", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "Q6_K", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "F32", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q8_0", "blk.13.ffn_down_exps.weight": "Q6_K", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "Q6_K", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "Q6_K", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "F32", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q8_0", "blk.14.ffn_down_exps.weight": "Q6_K", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "Q6_K", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "Q6_K", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "F32", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q8_0", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "Q6_K", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "Q6_K", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "Q6_K", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q8_0", "blk.16.ffn_down_exps.weight": "Q6_K", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "Q6_K", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "Q6_K", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "F32", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q8_0", "blk.17.ffn_down_exps.weight": "Q6_K", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "Q6_K", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "Q6_K", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "F32", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q8_0", "blk.18.ffn_down_exps.weight": "Q6_K", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "Q6_K", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "Q6_K", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "F32", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q8_0", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "Q6_K", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "Q6_K", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "Q6_K", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q8_0", "blk.2.ffn_down_exps.weight": "Q6_K", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "Q6_K", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "Q6_K", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "F32", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q8_0", "blk.20.ffn_down_exps.weight": "Q6_K", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "Q6_K", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "Q6_K", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "F32", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q8_0", "blk.21.ffn_down_exps.weight": "Q6_K", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "Q6_K", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "Q6_K", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "F32", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q8_0", "blk.22.ffn_down_exps.weight": "Q6_K", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "Q6_K", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "Q6_K", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "F32", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q8_0", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "Q6_K", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "Q6_K", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "Q6_K", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q8_0", "blk.24.ffn_down_exps.weight": "Q6_K", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "Q6_K", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "Q6_K", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "F32", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q8_0", "blk.25.ffn_down_exps.weight": "Q6_K", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "Q6_K", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "Q6_K", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "F32", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q8_0", "blk.26.ffn_down_exps.weight": "Q6_K", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "Q6_K", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "Q6_K", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "F32", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q8_0", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "Q6_K", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "Q6_K", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "Q6_K", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q8_0", "blk.28.ffn_down_exps.weight": "Q6_K", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "Q6_K", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "Q6_K", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "F32", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q8_0", "blk.29.ffn_down_exps.weight": "Q6_K", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "Q6_K", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "Q6_K", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "F32", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q8_0", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "Q6_K", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "Q6_K", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "Q6_K", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q8_0", "blk.30.ffn_down_exps.weight": "Q6_K", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "Q6_K", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "Q6_K", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "F32", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q8_0", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "Q6_K", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "Q6_K", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "Q6_K", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q8_0", "blk.32.ffn_down_exps.weight": "Q6_K", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "Q6_K", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "Q6_K", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "F32", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q8_0", "blk.33.ffn_down_exps.weight": "Q6_K", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "Q6_K", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "Q6_K", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "F32", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q8_0", "blk.34.ffn_down_exps.weight": "Q8_0", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "Q6_K", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "Q6_K", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "F32", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q8_0", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "Q6_K", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "Q6_K", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "Q6_K", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q8_0", "blk.36.ffn_down_exps.weight": "Q6_K", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "Q6_K", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "Q6_K", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "F32", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q8_0", "blk.37.ffn_down_exps.weight": "Q6_K", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "Q6_K", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "Q6_K", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "F32", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q8_0", "blk.38.ffn_down_exps.weight": "Q8_0", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "Q6_K", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "Q6_K", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "F32", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q8_0", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q8_0", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "Q6_K", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "Q6_K", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q8_0", "blk.4.ffn_down_exps.weight": "Q6_K", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "Q6_K", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "Q6_K", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "F32", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q8_0", "blk.5.ffn_down_exps.weight": "Q6_K", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "Q6_K", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "Q6_K", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "F32", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q8_0", "blk.6.ffn_down_exps.weight": "Q6_K", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "Q6_K", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "Q6_K", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "F32", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q8_0", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "Q6_K", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "Q6_K", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "Q6_K", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q8_0", "blk.8.ffn_down_exps.weight": "Q6_K", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "Q6_K", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "Q6_K", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "F32", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q8_0", "blk.9.ffn_down_exps.weight": "Q6_K", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "Q6_K", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "Q6_K", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "F32", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q6_K" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-Q5_K_S_1.gguf", "DisplayName": "MQ-Q5_K_S_1", "ShortName": "MQ-Q5_K_S_1", "Provider": "MagicQuant", "QuantFamily": "Q5_K_S", "BaseQuant": "Q5_K", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.00673, "SourcePpl": 5.679092, "SourcePplDeltaPercent": -0.1390539827677241, "SourceSizeBytes": 26333026720, "SourceSizeGB": 26.33302672, "SourceSizeGiB": 24.52454224228859, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q8_0", "blk.0.ffn_down_exps.weight": "Q6_K", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "Q5_K", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "Q5_K", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "F32", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q8_0", "blk.1.ffn_down_exps.weight": "Q6_K", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "Q5_K", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "Q5_K", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "F32", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q8_0", "blk.10.ffn_down_exps.weight": "Q6_K", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "Q5_K", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "Q5_K", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "F32", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q8_0", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "Q6_K", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "Q5_K", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "Q5_K", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q8_0", "blk.12.ffn_down_exps.weight": "Q6_K", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "Q5_K", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "Q5_K", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "F32", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q8_0", "blk.13.ffn_down_exps.weight": "Q6_K", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "Q5_K", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "Q5_K", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "F32", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q8_0", "blk.14.ffn_down_exps.weight": "Q6_K", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "Q5_K", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "Q5_K", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "F32", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q8_0", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "Q6_K", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "Q5_K", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "Q5_K", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q8_0", "blk.16.ffn_down_exps.weight": "Q6_K", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "Q5_K", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "Q5_K", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "F32", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q8_0", "blk.17.ffn_down_exps.weight": "Q6_K", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "Q5_K", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "Q5_K", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "F32", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q8_0", "blk.18.ffn_down_exps.weight": "Q6_K", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "Q5_K", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "Q5_K", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "F32", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q8_0", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "Q6_K", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "Q5_K", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "Q5_K", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q8_0", "blk.2.ffn_down_exps.weight": "Q6_K", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "Q5_K", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "Q5_K", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "F32", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q8_0", "blk.20.ffn_down_exps.weight": "Q6_K", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "Q5_K", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "Q5_K", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "F32", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q8_0", "blk.21.ffn_down_exps.weight": "Q6_K", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "Q5_K", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "Q5_K", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "F32", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q8_0", "blk.22.ffn_down_exps.weight": "Q6_K", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "Q5_K", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "Q5_K", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "F32", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q8_0", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "Q6_K", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "Q5_K", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "Q5_K", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q8_0", "blk.24.ffn_down_exps.weight": "Q6_K", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "Q5_K", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "Q5_K", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "F32", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q8_0", "blk.25.ffn_down_exps.weight": "Q6_K", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "Q5_K", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "Q5_K", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "F32", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q8_0", "blk.26.ffn_down_exps.weight": "Q6_K", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "Q5_K", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "Q5_K", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "F32", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q8_0", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "Q6_K", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "Q5_K", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "Q5_K", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q8_0", "blk.28.ffn_down_exps.weight": "Q6_K", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "Q5_K", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "Q5_K", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "F32", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q8_0", "blk.29.ffn_down_exps.weight": "Q6_K", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "Q5_K", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "Q5_K", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "F32", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q8_0", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "Q6_K", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "Q5_K", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "Q5_K", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q8_0", "blk.30.ffn_down_exps.weight": "Q6_K", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "Q5_K", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "Q5_K", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "F32", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q8_0", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "Q6_K", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "Q5_K", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "Q5_K", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q8_0", "blk.32.ffn_down_exps.weight": "Q6_K", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "Q5_K", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "Q5_K", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "F32", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q8_0", "blk.33.ffn_down_exps.weight": "Q6_K", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "Q5_K", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "Q5_K", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "F32", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q8_0", "blk.34.ffn_down_exps.weight": "Q8_0", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "Q5_K", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "Q5_K", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "F32", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q8_0", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "Q6_K", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "Q5_K", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "Q5_K", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q8_0", "blk.36.ffn_down_exps.weight": "Q6_K", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "Q5_K", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "Q5_K", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "F32", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q8_0", "blk.37.ffn_down_exps.weight": "Q6_K", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "Q5_K", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "Q5_K", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "F32", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q8_0", "blk.38.ffn_down_exps.weight": "Q8_0", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "Q5_K", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "Q5_K", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "F32", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q8_0", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q8_0", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "Q5_K", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "Q5_K", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q8_0", "blk.4.ffn_down_exps.weight": "Q6_K", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "Q5_K", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "Q5_K", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "F32", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q8_0", "blk.5.ffn_down_exps.weight": "Q6_K", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "Q5_K", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "Q5_K", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "F32", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q8_0", "blk.6.ffn_down_exps.weight": "Q6_K", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "Q5_K", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "Q5_K", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "F32", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q8_0", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "Q6_K", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "Q5_K", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "Q5_K", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q8_0", "blk.8.ffn_down_exps.weight": "Q6_K", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "Q5_K", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "Q5_K", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "F32", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q8_0", "blk.9.ffn_down_exps.weight": "Q6_K", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "Q5_K", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "Q5_K", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "F32", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q6_K" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-Q4_K_M_1.gguf", "DisplayName": "MQ-Q4_K_M_1", "ShortName": "MQ-Q4_K_M_1", "Provider": "MagicQuant", "QuantFamily": "Q4_K_M", "BaseQuant": "Q5_K_S", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.007799, "SourcePpl": 5.685451, "SourcePplDeltaPercent": -0.027237559345888666, "SourceSizeBytes": 24818882976, "SourceSizeGB": 24.818882976, "SourceSizeGiB": 23.11438599228859, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q8_0", "blk.0.ffn_down_exps.weight": "Q5_K", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "Q5_K", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "Q5_K", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "F32", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q8_0", "blk.1.ffn_down_exps.weight": "Q5_K", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "Q5_K", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "Q5_K", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "F32", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q8_0", "blk.10.ffn_down_exps.weight": "Q5_K", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "Q5_K", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "Q5_K", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "F32", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q8_0", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "Q5_K", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "Q5_K", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "Q5_K", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q8_0", "blk.12.ffn_down_exps.weight": "Q5_K", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "Q5_K", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "Q5_K", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "F32", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q8_0", "blk.13.ffn_down_exps.weight": "Q5_K", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "Q5_K", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "Q5_K", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "F32", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q8_0", "blk.14.ffn_down_exps.weight": "Q5_K", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "Q5_K", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "Q5_K", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "F32", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q8_0", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "Q5_K", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "Q5_K", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "Q5_K", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q8_0", "blk.16.ffn_down_exps.weight": "Q5_K", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "Q5_K", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "Q5_K", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "F32", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q8_0", "blk.17.ffn_down_exps.weight": "Q5_K", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "Q5_K", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "Q5_K", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "F32", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q8_0", "blk.18.ffn_down_exps.weight": "Q5_K", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "Q5_K", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "Q5_K", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "F32", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q8_0", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "Q5_K", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "Q5_K", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "Q5_K", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q8_0", "blk.2.ffn_down_exps.weight": "Q5_K", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "Q5_K", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "Q5_K", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "F32", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q8_0", "blk.20.ffn_down_exps.weight": "Q5_K", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "Q5_K", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "Q5_K", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "F32", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q8_0", "blk.21.ffn_down_exps.weight": "Q5_K", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "Q5_K", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "Q5_K", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "F32", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q8_0", "blk.22.ffn_down_exps.weight": "Q5_K", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "Q5_K", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "Q5_K", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "F32", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q8_0", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "Q5_K", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "Q5_K", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "Q5_K", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q8_0", "blk.24.ffn_down_exps.weight": "Q5_K", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "Q5_K", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "Q5_K", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "F32", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q8_0", "blk.25.ffn_down_exps.weight": "Q5_K", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "Q5_K", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "Q5_K", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "F32", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q8_0", "blk.26.ffn_down_exps.weight": "Q5_K", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "Q5_K", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "Q5_K", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "F32", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q8_0", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "Q5_K", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "Q5_K", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "Q5_K", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q8_0", "blk.28.ffn_down_exps.weight": "Q5_K", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "Q5_K", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "Q5_K", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "F32", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q8_0", "blk.29.ffn_down_exps.weight": "Q5_K", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "Q5_K", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "Q5_K", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "F32", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q8_0", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "Q5_K", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "Q5_K", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "Q5_K", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q8_0", "blk.30.ffn_down_exps.weight": "Q5_K", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "Q5_K", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "Q5_K", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "F32", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q8_0", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "Q5_K", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "Q5_K", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "Q5_K", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q8_0", "blk.32.ffn_down_exps.weight": "Q5_K", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "Q5_K", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "Q5_K", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "F32", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q8_0", "blk.33.ffn_down_exps.weight": "Q5_K", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "Q5_K", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "Q5_K", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "F32", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q8_0", "blk.34.ffn_down_exps.weight": "Q6_K", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "Q5_K", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "Q5_K", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "F32", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q8_0", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "Q5_K", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "Q5_K", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "Q5_K", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q8_0", "blk.36.ffn_down_exps.weight": "Q5_K", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "Q5_K", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "Q5_K", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "F32", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q8_0", "blk.37.ffn_down_exps.weight": "Q5_K", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "Q5_K", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "Q5_K", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "F32", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q8_0", "blk.38.ffn_down_exps.weight": "Q6_K", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "Q5_K", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "Q5_K", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "F32", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q8_0", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q6_K", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "Q5_K", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "Q5_K", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q8_0", "blk.4.ffn_down_exps.weight": "Q5_K", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "Q5_K", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "Q5_K", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "F32", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q8_0", "blk.5.ffn_down_exps.weight": "Q5_K", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "Q5_K", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "Q5_K", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "F32", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q8_0", "blk.6.ffn_down_exps.weight": "Q5_K", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "Q5_K", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "Q5_K", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "F32", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q8_0", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "Q5_K", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "Q5_K", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "Q5_K", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q8_0", "blk.8.ffn_down_exps.weight": "Q5_K", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "Q5_K", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "Q5_K", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "F32", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q8_0", "blk.9.ffn_down_exps.weight": "Q5_K", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "Q5_K", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "Q5_K", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "F32", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q6_K" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-Q4_K_M_2.gguf", "DisplayName": "MQ-Q4_K_M_2", "ShortName": "MQ-Q4_K_M_2", "Provider": "MagicQuant", "QuantFamily": "Q4_K_M", "BaseQuant": "Q4_K_M", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.011007, "SourcePpl": 5.694152, "SourcePplDeltaPercent": 0.12576050641813968, "SourceSizeBytes": 22324804000, "SourceSizeGB": 22.324804, "SourceSizeGiB": 20.791593939065933, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q8_0", "blk.0.ffn_down_exps.weight": "Q5_K", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "Q4_K", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "Q4_K", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "F32", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q8_0", "blk.1.ffn_down_exps.weight": "Q5_K", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "Q5_K", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "Q5_K", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "F32", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q8_0", "blk.10.ffn_down_exps.weight": "Q5_K", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "Q4_K", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "Q4_K", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "F32", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q8_0", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "Q5_K", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "Q4_K", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "Q4_K", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q8_0", "blk.12.ffn_down_exps.weight": "Q5_K", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "Q4_K", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "Q4_K", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "F32", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q8_0", "blk.13.ffn_down_exps.weight": "Q5_K", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "Q4_K", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "Q4_K", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "F32", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q8_0", "blk.14.ffn_down_exps.weight": "Q5_K", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "Q4_K", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "Q4_K", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "F32", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q8_0", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "Q5_K", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "Q4_K", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "Q4_K", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q8_0", "blk.16.ffn_down_exps.weight": "Q5_K", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "Q4_K", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "Q4_K", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "F32", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q8_0", "blk.17.ffn_down_exps.weight": "Q5_K", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "Q4_K", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "Q4_K", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "F32", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q8_0", "blk.18.ffn_down_exps.weight": "Q5_K", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "Q4_K", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "Q4_K", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "F32", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q8_0", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "Q5_K", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "Q4_K", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "Q4_K", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q8_0", "blk.2.ffn_down_exps.weight": "Q5_K", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "Q4_K", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "Q4_K", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "F32", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q8_0", "blk.20.ffn_down_exps.weight": "Q5_K", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "Q4_K", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "Q4_K", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "F32", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q8_0", "blk.21.ffn_down_exps.weight": "Q5_K", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "Q4_K", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "Q4_K", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "F32", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q8_0", "blk.22.ffn_down_exps.weight": "Q5_K", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "Q4_K", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "Q4_K", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "F32", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q8_0", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "Q5_K", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "Q4_K", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "Q4_K", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q8_0", "blk.24.ffn_down_exps.weight": "Q5_K", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "Q4_K", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "Q4_K", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "F32", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q8_0", "blk.25.ffn_down_exps.weight": "Q5_K", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "Q4_K", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "Q4_K", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "F32", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q8_0", "blk.26.ffn_down_exps.weight": "Q5_K", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "Q4_K", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "Q4_K", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "F32", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q8_0", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "Q5_K", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "Q4_K", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "Q4_K", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q8_0", "blk.28.ffn_down_exps.weight": "Q5_K", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "Q4_K", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "Q4_K", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "F32", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q8_0", "blk.29.ffn_down_exps.weight": "Q5_K", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "Q4_K", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "Q4_K", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "F32", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q8_0", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "Q5_K", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "Q4_K", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "Q4_K", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q8_0", "blk.30.ffn_down_exps.weight": "Q5_K", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "Q4_K", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "Q4_K", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "F32", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q8_0", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "Q5_K", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "Q4_K", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "Q4_K", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q8_0", "blk.32.ffn_down_exps.weight": "Q5_K", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "Q4_K", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "Q4_K", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "F32", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q8_0", "blk.33.ffn_down_exps.weight": "Q5_K", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "Q4_K", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "Q4_K", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "F32", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q8_0", "blk.34.ffn_down_exps.weight": "Q6_K", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "Q4_K", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "Q4_K", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "F32", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q8_0", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "Q5_K", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "Q4_K", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "Q4_K", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q8_0", "blk.36.ffn_down_exps.weight": "Q5_K", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "Q4_K", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "Q4_K", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "F32", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q8_0", "blk.37.ffn_down_exps.weight": "Q5_K", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "Q4_K", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "Q4_K", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "F32", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q8_0", "blk.38.ffn_down_exps.weight": "Q6_K", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "Q4_K", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "Q4_K", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "F32", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q8_0", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q6_K", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "Q4_K", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "Q4_K", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q8_0", "blk.4.ffn_down_exps.weight": "Q5_K", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "Q4_K", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "Q4_K", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "F32", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q8_0", "blk.5.ffn_down_exps.weight": "Q5_K", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "Q4_K", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "Q4_K", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "F32", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q8_0", "blk.6.ffn_down_exps.weight": "Q5_K", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "Q4_K", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "Q4_K", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "F32", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q8_0", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "Q5_K", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "Q4_K", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "Q4_K", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q8_0", "blk.8.ffn_down_exps.weight": "Q5_K", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "Q4_K", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "Q4_K", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "F32", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q8_0", "blk.9.ffn_down_exps.weight": "Q5_K", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "Q4_K", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "Q4_K", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "F32", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q8_0" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-IQ4_NL_1.gguf", "DisplayName": "MQ-IQ4_NL_1", "ShortName": "MQ-IQ4_NL_1", "Provider": "MagicQuant", "QuantFamily": "IQ4_NL", "BaseQuant": "Q8_0", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.013277, "SourcePpl": 5.708942, "SourcePplDeltaPercent": 0.38582732547916526, "SourceSizeBytes": 20887239072, "SourceSizeGB": 20.887239072, "SourceSizeGiB": 19.45275726914406, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q8_0", "blk.0.ffn_down_exps.weight": "Q4_K", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "Q4_K", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "Q4_K", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "Q8_0", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q8_0", "blk.1.ffn_down_exps.weight": "Q4_K", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "Q4_K", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "Q4_K", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "Q8_0", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q8_0", "blk.10.ffn_down_exps.weight": "Q4_K", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "Q4_K", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "Q4_K", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "Q8_0", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q8_0", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "Q4_K", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "Q4_K", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "Q4_K", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q8_0", "blk.12.ffn_down_exps.weight": "Q4_K", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "Q4_K", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "Q4_K", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "Q8_0", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q8_0", "blk.13.ffn_down_exps.weight": "Q4_K", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "Q4_K", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "Q4_K", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "Q8_0", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q8_0", "blk.14.ffn_down_exps.weight": "Q4_K", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "Q4_K", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "Q4_K", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "Q8_0", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q8_0", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "Q4_K", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "Q4_K", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "Q4_K", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q8_0", "blk.16.ffn_down_exps.weight": "Q4_K", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "Q4_K", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "Q4_K", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "Q8_0", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q8_0", "blk.17.ffn_down_exps.weight": "Q4_K", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "Q4_K", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "Q4_K", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "Q8_0", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q8_0", "blk.18.ffn_down_exps.weight": "Q4_K", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "Q4_K", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "Q4_K", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "Q8_0", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q8_0", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "Q4_K", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "Q4_K", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "Q4_K", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q8_0", "blk.2.ffn_down_exps.weight": "Q4_K", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "Q4_K", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "Q4_K", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "Q8_0", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q8_0", "blk.20.ffn_down_exps.weight": "Q4_K", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "Q4_K", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "Q4_K", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "Q8_0", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q8_0", "blk.21.ffn_down_exps.weight": "Q4_K", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "Q4_K", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "Q4_K", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "Q8_0", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q8_0", "blk.22.ffn_down_exps.weight": "Q4_K", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "Q4_K", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "Q4_K", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "Q8_0", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q8_0", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "Q4_K", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "Q4_K", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "Q4_K", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q8_0", "blk.24.ffn_down_exps.weight": "Q4_K", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "Q4_K", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "Q4_K", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "Q8_0", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q8_0", "blk.25.ffn_down_exps.weight": "Q4_K", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "Q4_K", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "Q4_K", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "Q8_0", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q8_0", "blk.26.ffn_down_exps.weight": "Q4_K", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "Q4_K", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "Q4_K", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "Q8_0", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q8_0", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "Q4_K", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "Q4_K", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "Q4_K", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q8_0", "blk.28.ffn_down_exps.weight": "Q4_K", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "Q4_K", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "Q4_K", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "Q8_0", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q8_0", "blk.29.ffn_down_exps.weight": "Q4_K", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "Q4_K", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "Q4_K", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "Q8_0", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q8_0", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "Q4_K", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "Q4_K", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "Q4_K", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q8_0", "blk.30.ffn_down_exps.weight": "Q4_K", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "Q4_K", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "Q4_K", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "Q8_0", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q8_0", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "Q4_K", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "Q4_K", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "Q4_K", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q8_0", "blk.32.ffn_down_exps.weight": "Q4_K", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "Q4_K", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "Q4_K", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "Q8_0", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q8_0", "blk.33.ffn_down_exps.weight": "Q4_K", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "Q4_K", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "Q4_K", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "Q8_0", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q8_0", "blk.34.ffn_down_exps.weight": "Q6_K", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "Q4_K", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "Q4_K", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "Q8_0", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q8_0", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "Q4_K", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "Q4_K", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "Q4_K", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q8_0", "blk.36.ffn_down_exps.weight": "Q4_K", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "Q4_K", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "Q4_K", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "Q8_0", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q8_0", "blk.37.ffn_down_exps.weight": "Q4_K", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "Q4_K", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "Q4_K", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "Q8_0", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q8_0", "blk.38.ffn_down_exps.weight": "Q6_K", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "Q4_K", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "Q4_K", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "Q8_0", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q8_0", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q6_K", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "Q4_K", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "Q4_K", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q8_0", "blk.4.ffn_down_exps.weight": "Q4_K", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "Q4_K", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "Q4_K", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "Q8_0", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q8_0", "blk.5.ffn_down_exps.weight": "Q4_K", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "Q4_K", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "Q4_K", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "Q8_0", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q8_0", "blk.6.ffn_down_exps.weight": "Q4_K", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "Q4_K", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "Q4_K", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "Q8_0", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q8_0", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "Q4_K", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "Q4_K", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "Q4_K", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q8_0", "blk.8.ffn_down_exps.weight": "Q4_K", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "Q4_K", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "Q4_K", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "Q8_0", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q8_0", "blk.9.ffn_down_exps.weight": "Q4_K", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "Q4_K", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "Q4_K", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "Q8_0", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q6_K" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-IQ3_M_1.gguf", "DisplayName": "MQ-IQ3_M_1", "ShortName": "MQ-IQ3_M_1", "Provider": "MagicQuant", "QuantFamily": "IQ3_M", "BaseQuant": "Q8_0", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.02633, "SourcePpl": 5.764787, "SourcePplDeltaPercent": 1.3678037629681699, "SourceSizeBytes": 17604147616, "SourceSizeGB": 17.604147616000002, "SourceSizeGiB": 16.39514008164406, "TensorTypes": { "blk.0.attn_gate.weight": "Q8_0", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q6_K", "blk.0.ffn_down_exps.weight": "IQ4_XS", "blk.0.ffn_down_shexp.weight": "Q8_0", "blk.0.ffn_gate_exps.weight": "IQ3_S", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q8_0", "blk.0.ffn_up_exps.weight": "IQ3_S", "blk.0.ffn_up_shexp.weight": "Q8_0", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "Q8_0", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q8_0", "blk.1.attn_gate.weight": "Q8_0", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q6_K", "blk.1.ffn_down_exps.weight": "Q5_K", "blk.1.ffn_down_shexp.weight": "Q8_0", "blk.1.ffn_gate_exps.weight": "IQ3_S", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q8_0", "blk.1.ffn_up_exps.weight": "IQ3_S", "blk.1.ffn_up_shexp.weight": "Q8_0", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "Q8_0", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q8_0", "blk.10.attn_gate.weight": "Q8_0", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q6_K", "blk.10.ffn_down_exps.weight": "IQ4_XS", "blk.10.ffn_down_shexp.weight": "Q8_0", "blk.10.ffn_gate_exps.weight": "IQ3_S", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q8_0", "blk.10.ffn_up_exps.weight": "IQ3_S", "blk.10.ffn_up_shexp.weight": "Q8_0", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "Q8_0", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q8_0", "blk.11.attn_k.weight": "Q8_0", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q8_0", "blk.11.attn_q.weight": "Q6_K", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q8_0", "blk.11.ffn_down_exps.weight": "IQ4_XS", "blk.11.ffn_down_shexp.weight": "Q8_0", "blk.11.ffn_gate_exps.weight": "IQ3_S", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q8_0", "blk.11.ffn_up_exps.weight": "IQ3_S", "blk.11.ffn_up_shexp.weight": "Q8_0", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q8_0", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q6_K", "blk.12.ffn_down_exps.weight": "IQ4_XS", "blk.12.ffn_down_shexp.weight": "Q8_0", "blk.12.ffn_gate_exps.weight": "IQ3_S", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q8_0", "blk.12.ffn_up_exps.weight": "IQ3_S", "blk.12.ffn_up_shexp.weight": "Q8_0", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "Q8_0", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q8_0", "blk.13.attn_gate.weight": "Q8_0", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q6_K", "blk.13.ffn_down_exps.weight": "IQ4_XS", "blk.13.ffn_down_shexp.weight": "Q8_0", "blk.13.ffn_gate_exps.weight": "IQ3_S", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q8_0", "blk.13.ffn_up_exps.weight": "IQ3_S", "blk.13.ffn_up_shexp.weight": "Q8_0", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "Q8_0", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q8_0", "blk.14.attn_gate.weight": "Q8_0", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q6_K", "blk.14.ffn_down_exps.weight": "IQ4_XS", "blk.14.ffn_down_shexp.weight": "Q8_0", "blk.14.ffn_gate_exps.weight": "IQ3_S", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q8_0", "blk.14.ffn_up_exps.weight": "IQ3_S", "blk.14.ffn_up_shexp.weight": "Q8_0", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "Q8_0", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q8_0", "blk.15.attn_k.weight": "Q8_0", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q8_0", "blk.15.attn_q.weight": "Q6_K", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q8_0", "blk.15.ffn_down_exps.weight": "IQ4_XS", "blk.15.ffn_down_shexp.weight": "Q8_0", "blk.15.ffn_gate_exps.weight": "IQ3_S", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q8_0", "blk.15.ffn_up_exps.weight": "IQ3_S", "blk.15.ffn_up_shexp.weight": "Q8_0", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q8_0", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q6_K", "blk.16.ffn_down_exps.weight": "IQ4_XS", "blk.16.ffn_down_shexp.weight": "Q8_0", "blk.16.ffn_gate_exps.weight": "IQ3_S", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q8_0", "blk.16.ffn_up_exps.weight": "IQ3_S", "blk.16.ffn_up_shexp.weight": "Q8_0", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "Q8_0", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q8_0", "blk.17.attn_gate.weight": "Q8_0", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q6_K", "blk.17.ffn_down_exps.weight": "IQ4_XS", "blk.17.ffn_down_shexp.weight": "Q8_0", "blk.17.ffn_gate_exps.weight": "IQ3_S", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q8_0", "blk.17.ffn_up_exps.weight": "IQ3_S", "blk.17.ffn_up_shexp.weight": "Q8_0", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "Q8_0", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q8_0", "blk.18.attn_gate.weight": "Q8_0", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q6_K", "blk.18.ffn_down_exps.weight": "IQ4_XS", "blk.18.ffn_down_shexp.weight": "Q8_0", "blk.18.ffn_gate_exps.weight": "IQ3_S", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q8_0", "blk.18.ffn_up_exps.weight": "IQ3_S", "blk.18.ffn_up_shexp.weight": "Q8_0", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "Q8_0", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q8_0", "blk.19.attn_k.weight": "Q8_0", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q8_0", "blk.19.attn_q.weight": "Q6_K", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q8_0", "blk.19.ffn_down_exps.weight": "IQ4_XS", "blk.19.ffn_down_shexp.weight": "Q8_0", "blk.19.ffn_gate_exps.weight": "IQ3_S", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q8_0", "blk.19.ffn_up_exps.weight": "IQ3_S", "blk.19.ffn_up_shexp.weight": "Q8_0", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q8_0", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q6_K", "blk.2.ffn_down_exps.weight": "IQ4_XS", "blk.2.ffn_down_shexp.weight": "Q8_0", "blk.2.ffn_gate_exps.weight": "IQ3_S", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q8_0", "blk.2.ffn_up_exps.weight": "IQ3_S", "blk.2.ffn_up_shexp.weight": "Q8_0", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "Q8_0", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q8_0", "blk.20.attn_gate.weight": "Q8_0", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q6_K", "blk.20.ffn_down_exps.weight": "IQ4_XS", "blk.20.ffn_down_shexp.weight": "Q8_0", "blk.20.ffn_gate_exps.weight": "IQ3_S", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q8_0", "blk.20.ffn_up_exps.weight": "IQ3_S", "blk.20.ffn_up_shexp.weight": "Q8_0", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "Q8_0", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q8_0", "blk.21.attn_gate.weight": "Q8_0", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q6_K", "blk.21.ffn_down_exps.weight": "IQ4_XS", "blk.21.ffn_down_shexp.weight": "Q8_0", "blk.21.ffn_gate_exps.weight": "IQ3_S", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q8_0", "blk.21.ffn_up_exps.weight": "IQ3_S", "blk.21.ffn_up_shexp.weight": "Q8_0", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "Q8_0", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q8_0", "blk.22.attn_gate.weight": "Q8_0", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q6_K", "blk.22.ffn_down_exps.weight": "IQ4_XS", "blk.22.ffn_down_shexp.weight": "Q8_0", "blk.22.ffn_gate_exps.weight": "IQ3_S", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q8_0", "blk.22.ffn_up_exps.weight": "IQ3_S", "blk.22.ffn_up_shexp.weight": "Q8_0", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "Q8_0", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q8_0", "blk.23.attn_k.weight": "Q8_0", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q8_0", "blk.23.attn_q.weight": "Q6_K", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q8_0", "blk.23.ffn_down_exps.weight": "IQ4_XS", "blk.23.ffn_down_shexp.weight": "Q8_0", "blk.23.ffn_gate_exps.weight": "IQ3_S", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q8_0", "blk.23.ffn_up_exps.weight": "IQ3_S", "blk.23.ffn_up_shexp.weight": "Q8_0", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q8_0", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q6_K", "blk.24.ffn_down_exps.weight": "IQ4_XS", "blk.24.ffn_down_shexp.weight": "Q8_0", "blk.24.ffn_gate_exps.weight": "IQ3_S", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q8_0", "blk.24.ffn_up_exps.weight": "IQ3_S", "blk.24.ffn_up_shexp.weight": "Q8_0", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "Q8_0", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q8_0", "blk.25.attn_gate.weight": "Q8_0", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q6_K", "blk.25.ffn_down_exps.weight": "IQ4_XS", "blk.25.ffn_down_shexp.weight": "Q8_0", "blk.25.ffn_gate_exps.weight": "IQ3_S", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q8_0", "blk.25.ffn_up_exps.weight": "IQ3_S", "blk.25.ffn_up_shexp.weight": "Q8_0", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "Q8_0", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q8_0", "blk.26.attn_gate.weight": "Q8_0", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q6_K", "blk.26.ffn_down_exps.weight": "IQ4_XS", "blk.26.ffn_down_shexp.weight": "Q8_0", "blk.26.ffn_gate_exps.weight": "IQ3_S", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q8_0", "blk.26.ffn_up_exps.weight": "IQ3_S", "blk.26.ffn_up_shexp.weight": "Q8_0", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "Q8_0", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q8_0", "blk.27.attn_k.weight": "Q8_0", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q8_0", "blk.27.attn_q.weight": "Q6_K", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q8_0", "blk.27.ffn_down_exps.weight": "IQ4_XS", "blk.27.ffn_down_shexp.weight": "Q8_0", "blk.27.ffn_gate_exps.weight": "IQ3_S", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q8_0", "blk.27.ffn_up_exps.weight": "IQ3_S", "blk.27.ffn_up_shexp.weight": "Q8_0", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q8_0", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q6_K", "blk.28.ffn_down_exps.weight": "IQ4_XS", "blk.28.ffn_down_shexp.weight": "Q8_0", "blk.28.ffn_gate_exps.weight": "IQ3_S", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q8_0", "blk.28.ffn_up_exps.weight": "IQ3_S", "blk.28.ffn_up_shexp.weight": "Q8_0", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "Q8_0", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q8_0", "blk.29.attn_gate.weight": "Q8_0", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q6_K", "blk.29.ffn_down_exps.weight": "IQ4_XS", "blk.29.ffn_down_shexp.weight": "Q8_0", "blk.29.ffn_gate_exps.weight": "IQ3_S", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q8_0", "blk.29.ffn_up_exps.weight": "IQ3_S", "blk.29.ffn_up_shexp.weight": "Q8_0", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "Q8_0", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q8_0", "blk.3.attn_k.weight": "Q8_0", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q8_0", "blk.3.attn_q.weight": "Q6_K", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q8_0", "blk.3.ffn_down_exps.weight": "IQ4_XS", "blk.3.ffn_down_shexp.weight": "Q8_0", "blk.3.ffn_gate_exps.weight": "IQ3_S", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q8_0", "blk.3.ffn_up_exps.weight": "IQ3_S", "blk.3.ffn_up_shexp.weight": "Q8_0", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q8_0", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q6_K", "blk.30.ffn_down_exps.weight": "IQ4_XS", "blk.30.ffn_down_shexp.weight": "Q8_0", "blk.30.ffn_gate_exps.weight": "IQ3_S", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q8_0", "blk.30.ffn_up_exps.weight": "IQ3_S", "blk.30.ffn_up_shexp.weight": "Q8_0", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "Q8_0", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q8_0", "blk.31.attn_k.weight": "Q8_0", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q8_0", "blk.31.attn_q.weight": "Q6_K", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q8_0", "blk.31.ffn_down_exps.weight": "IQ4_XS", "blk.31.ffn_down_shexp.weight": "Q8_0", "blk.31.ffn_gate_exps.weight": "IQ3_S", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q8_0", "blk.31.ffn_up_exps.weight": "IQ3_S", "blk.31.ffn_up_shexp.weight": "Q8_0", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q8_0", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q6_K", "blk.32.ffn_down_exps.weight": "IQ4_XS", "blk.32.ffn_down_shexp.weight": "Q8_0", "blk.32.ffn_gate_exps.weight": "IQ3_S", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q8_0", "blk.32.ffn_up_exps.weight": "IQ3_S", "blk.32.ffn_up_shexp.weight": "Q8_0", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "Q8_0", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q8_0", "blk.33.attn_gate.weight": "Q8_0", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q6_K", "blk.33.ffn_down_exps.weight": "IQ4_XS", "blk.33.ffn_down_shexp.weight": "Q8_0", "blk.33.ffn_gate_exps.weight": "IQ3_S", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q8_0", "blk.33.ffn_up_exps.weight": "IQ3_S", "blk.33.ffn_up_shexp.weight": "Q8_0", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "Q8_0", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q8_0", "blk.34.attn_gate.weight": "Q8_0", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q6_K", "blk.34.ffn_down_exps.weight": "Q6_K", "blk.34.ffn_down_shexp.weight": "Q8_0", "blk.34.ffn_gate_exps.weight": "IQ3_S", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q8_0", "blk.34.ffn_up_exps.weight": "IQ3_S", "blk.34.ffn_up_shexp.weight": "Q8_0", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "Q8_0", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q8_0", "blk.35.attn_k.weight": "Q8_0", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q8_0", "blk.35.attn_q.weight": "Q6_K", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q8_0", "blk.35.ffn_down_exps.weight": "IQ4_XS", "blk.35.ffn_down_shexp.weight": "Q8_0", "blk.35.ffn_gate_exps.weight": "IQ3_S", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q8_0", "blk.35.ffn_up_exps.weight": "IQ3_S", "blk.35.ffn_up_shexp.weight": "Q8_0", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q8_0", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q6_K", "blk.36.ffn_down_exps.weight": "IQ4_XS", "blk.36.ffn_down_shexp.weight": "Q8_0", "blk.36.ffn_gate_exps.weight": "IQ3_S", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q8_0", "blk.36.ffn_up_exps.weight": "IQ3_S", "blk.36.ffn_up_shexp.weight": "Q8_0", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "Q8_0", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q8_0", "blk.37.attn_gate.weight": "Q8_0", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q6_K", "blk.37.ffn_down_exps.weight": "IQ4_XS", "blk.37.ffn_down_shexp.weight": "Q8_0", "blk.37.ffn_gate_exps.weight": "IQ3_S", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q8_0", "blk.37.ffn_up_exps.weight": "IQ3_S", "blk.37.ffn_up_shexp.weight": "Q8_0", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "Q8_0", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q8_0", "blk.38.attn_gate.weight": "Q8_0", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q6_K", "blk.38.ffn_down_exps.weight": "Q6_K", "blk.38.ffn_down_shexp.weight": "Q8_0", "blk.38.ffn_gate_exps.weight": "IQ3_S", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q8_0", "blk.38.ffn_up_exps.weight": "IQ3_S", "blk.38.ffn_up_shexp.weight": "Q8_0", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "Q8_0", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q8_0", "blk.39.attn_k.weight": "Q8_0", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q8_0", "blk.39.attn_q.weight": "Q6_K", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q8_0", "blk.39.ffn_down_exps.weight": "Q6_K", "blk.39.ffn_down_shexp.weight": "Q8_0", "blk.39.ffn_gate_exps.weight": "IQ3_S", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q8_0", "blk.39.ffn_up_exps.weight": "IQ3_S", "blk.39.ffn_up_shexp.weight": "Q8_0", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q8_0", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q6_K", "blk.4.ffn_down_exps.weight": "IQ4_XS", "blk.4.ffn_down_shexp.weight": "Q8_0", "blk.4.ffn_gate_exps.weight": "IQ3_S", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q8_0", "blk.4.ffn_up_exps.weight": "IQ3_S", "blk.4.ffn_up_shexp.weight": "Q8_0", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "Q8_0", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q8_0", "blk.5.attn_gate.weight": "Q8_0", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q6_K", "blk.5.ffn_down_exps.weight": "IQ4_XS", "blk.5.ffn_down_shexp.weight": "Q8_0", "blk.5.ffn_gate_exps.weight": "IQ3_S", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q8_0", "blk.5.ffn_up_exps.weight": "IQ3_S", "blk.5.ffn_up_shexp.weight": "Q8_0", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "Q8_0", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q8_0", "blk.6.attn_gate.weight": "Q8_0", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q6_K", "blk.6.ffn_down_exps.weight": "IQ4_XS", "blk.6.ffn_down_shexp.weight": "Q8_0", "blk.6.ffn_gate_exps.weight": "IQ3_S", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q8_0", "blk.6.ffn_up_exps.weight": "IQ3_S", "blk.6.ffn_up_shexp.weight": "Q8_0", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "Q8_0", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q8_0", "blk.7.attn_k.weight": "Q8_0", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q8_0", "blk.7.attn_q.weight": "Q6_K", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q8_0", "blk.7.ffn_down_exps.weight": "IQ4_XS", "blk.7.ffn_down_shexp.weight": "Q8_0", "blk.7.ffn_gate_exps.weight": "IQ3_S", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q8_0", "blk.7.ffn_up_exps.weight": "IQ3_S", "blk.7.ffn_up_shexp.weight": "Q8_0", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q8_0", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q6_K", "blk.8.ffn_down_exps.weight": "IQ4_XS", "blk.8.ffn_down_shexp.weight": "Q8_0", "blk.8.ffn_gate_exps.weight": "IQ3_S", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q8_0", "blk.8.ffn_up_exps.weight": "IQ3_S", "blk.8.ffn_up_shexp.weight": "Q8_0", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "Q8_0", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q8_0", "blk.9.attn_gate.weight": "Q8_0", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q6_K", "blk.9.ffn_down_exps.weight": "IQ4_XS", "blk.9.ffn_down_shexp.weight": "Q8_0", "blk.9.ffn_gate_exps.weight": "IQ3_S", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q8_0", "blk.9.ffn_up_exps.weight": "IQ3_S", "blk.9.ffn_up_shexp.weight": "Q8_0", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "Q8_0", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q8_0", "output.weight": "Q8_0", "output_norm.weight": "F32", "token_embd.weight": "Q6_K" } }, { "FileName": "Qwen3.6-35B-A3B-UD-IQ3_S.gguf", "DisplayName": "UD-IQ3_S", "ShortName": "UD-IQ3_S", "Provider": "Unsloth", "QuantFamily": "UD-IQ3_S", "BaseQuant": "IQ3_S", "IsHybrid": false, "UsedImatrix": true, "SourceKld": 0.068376, "SourcePpl": 5.970404, "SourcePplDeltaPercent": 4.983365570599613, "SourceSizeBytes": 13676722592, "SourceSizeGB": 13.676722592, "SourceSizeGiB": 12.73744049668312, "TensorTypes": { "blk.0.attn_gate.weight": "Q6_K", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q6_K", "blk.0.ffn_down_exps.weight": "IQ3_S", "blk.0.ffn_down_shexp.weight": "Q6_K", "blk.0.ffn_gate_exps.weight": "IQ2_S", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "Q6_K", "blk.0.ffn_up_exps.weight": "IQ2_S", "blk.0.ffn_up_shexp.weight": "Q6_K", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "F32", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "Q6_K", "blk.1.attn_gate.weight": "Q6_K", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q6_K", "blk.1.ffn_down_exps.weight": "IQ3_S", "blk.1.ffn_down_shexp.weight": "Q6_K", "blk.1.ffn_gate_exps.weight": "IQ2_S", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "Q6_K", "blk.1.ffn_up_exps.weight": "IQ2_S", "blk.1.ffn_up_shexp.weight": "Q6_K", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "F32", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "Q6_K", "blk.10.attn_gate.weight": "Q6_K", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q6_K", "blk.10.ffn_down_exps.weight": "IQ3_S", "blk.10.ffn_down_shexp.weight": "Q6_K", "blk.10.ffn_gate_exps.weight": "IQ2_S", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "Q6_K", "blk.10.ffn_up_exps.weight": "IQ2_S", "blk.10.ffn_up_shexp.weight": "Q6_K", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "F32", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "Q6_K", "blk.11.attn_k.weight": "Q6_K", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "Q6_K", "blk.11.attn_q.weight": "Q6_K", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q6_K", "blk.11.ffn_down_exps.weight": "IQ3_S", "blk.11.ffn_down_shexp.weight": "Q6_K", "blk.11.ffn_gate_exps.weight": "IQ2_S", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "Q6_K", "blk.11.ffn_up_exps.weight": "IQ2_S", "blk.11.ffn_up_shexp.weight": "Q6_K", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "Q6_K", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q6_K", "blk.12.ffn_down_exps.weight": "IQ3_S", "blk.12.ffn_down_shexp.weight": "Q6_K", "blk.12.ffn_gate_exps.weight": "IQ2_S", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "Q6_K", "blk.12.ffn_up_exps.weight": "IQ2_S", "blk.12.ffn_up_shexp.weight": "Q6_K", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "F32", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "Q6_K", "blk.13.attn_gate.weight": "Q6_K", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q6_K", "blk.13.ffn_down_exps.weight": "IQ3_S", "blk.13.ffn_down_shexp.weight": "Q6_K", "blk.13.ffn_gate_exps.weight": "IQ2_S", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "Q6_K", "blk.13.ffn_up_exps.weight": "IQ2_S", "blk.13.ffn_up_shexp.weight": "Q6_K", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "F32", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "Q6_K", "blk.14.attn_gate.weight": "Q6_K", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q6_K", "blk.14.ffn_down_exps.weight": "IQ3_S", "blk.14.ffn_down_shexp.weight": "Q6_K", "blk.14.ffn_gate_exps.weight": "IQ2_S", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "Q6_K", "blk.14.ffn_up_exps.weight": "IQ2_S", "blk.14.ffn_up_shexp.weight": "Q6_K", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "F32", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "Q6_K", "blk.15.attn_k.weight": "Q6_K", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "Q6_K", "blk.15.attn_q.weight": "Q6_K", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q6_K", "blk.15.ffn_down_exps.weight": "IQ3_S", "blk.15.ffn_down_shexp.weight": "Q6_K", "blk.15.ffn_gate_exps.weight": "IQ2_S", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "Q6_K", "blk.15.ffn_up_exps.weight": "IQ2_S", "blk.15.ffn_up_shexp.weight": "Q6_K", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "Q6_K", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q6_K", "blk.16.ffn_down_exps.weight": "IQ3_S", "blk.16.ffn_down_shexp.weight": "Q6_K", "blk.16.ffn_gate_exps.weight": "IQ2_S", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "Q6_K", "blk.16.ffn_up_exps.weight": "IQ2_S", "blk.16.ffn_up_shexp.weight": "Q6_K", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "F32", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "Q6_K", "blk.17.attn_gate.weight": "Q6_K", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q6_K", "blk.17.ffn_down_exps.weight": "IQ3_S", "blk.17.ffn_down_shexp.weight": "Q6_K", "blk.17.ffn_gate_exps.weight": "IQ2_S", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "Q6_K", "blk.17.ffn_up_exps.weight": "IQ2_S", "blk.17.ffn_up_shexp.weight": "Q6_K", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "F32", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "Q6_K", "blk.18.attn_gate.weight": "Q6_K", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q6_K", "blk.18.ffn_down_exps.weight": "IQ3_S", "blk.18.ffn_down_shexp.weight": "Q6_K", "blk.18.ffn_gate_exps.weight": "IQ2_S", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "Q6_K", "blk.18.ffn_up_exps.weight": "IQ2_S", "blk.18.ffn_up_shexp.weight": "Q6_K", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "F32", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "Q6_K", "blk.19.attn_k.weight": "Q6_K", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "Q6_K", "blk.19.attn_q.weight": "Q6_K", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q6_K", "blk.19.ffn_down_exps.weight": "IQ3_S", "blk.19.ffn_down_shexp.weight": "Q6_K", "blk.19.ffn_gate_exps.weight": "IQ2_S", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "Q6_K", "blk.19.ffn_up_exps.weight": "IQ2_S", "blk.19.ffn_up_shexp.weight": "Q6_K", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "Q6_K", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q6_K", "blk.2.ffn_down_exps.weight": "IQ3_S", "blk.2.ffn_down_shexp.weight": "Q6_K", "blk.2.ffn_gate_exps.weight": "IQ2_S", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "Q6_K", "blk.2.ffn_up_exps.weight": "IQ2_S", "blk.2.ffn_up_shexp.weight": "Q6_K", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "F32", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "Q6_K", "blk.20.attn_gate.weight": "Q6_K", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q6_K", "blk.20.ffn_down_exps.weight": "IQ3_S", "blk.20.ffn_down_shexp.weight": "Q6_K", "blk.20.ffn_gate_exps.weight": "IQ2_S", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "Q6_K", "blk.20.ffn_up_exps.weight": "IQ2_S", "blk.20.ffn_up_shexp.weight": "Q6_K", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "F32", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "Q6_K", "blk.21.attn_gate.weight": "Q6_K", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q6_K", "blk.21.ffn_down_exps.weight": "IQ3_S", "blk.21.ffn_down_shexp.weight": "Q6_K", "blk.21.ffn_gate_exps.weight": "IQ2_S", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "Q6_K", "blk.21.ffn_up_exps.weight": "IQ2_S", "blk.21.ffn_up_shexp.weight": "Q6_K", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "F32", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "Q6_K", "blk.22.attn_gate.weight": "Q6_K", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q6_K", "blk.22.ffn_down_exps.weight": "IQ3_S", "blk.22.ffn_down_shexp.weight": "Q6_K", "blk.22.ffn_gate_exps.weight": "IQ2_S", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "Q6_K", "blk.22.ffn_up_exps.weight": "IQ2_S", "blk.22.ffn_up_shexp.weight": "Q6_K", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "F32", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "Q6_K", "blk.23.attn_k.weight": "Q6_K", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "Q6_K", "blk.23.attn_q.weight": "Q6_K", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q6_K", "blk.23.ffn_down_exps.weight": "IQ3_S", "blk.23.ffn_down_shexp.weight": "Q6_K", "blk.23.ffn_gate_exps.weight": "IQ2_S", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "Q6_K", "blk.23.ffn_up_exps.weight": "IQ2_S", "blk.23.ffn_up_shexp.weight": "Q6_K", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "Q6_K", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q6_K", "blk.24.ffn_down_exps.weight": "IQ3_S", "blk.24.ffn_down_shexp.weight": "Q6_K", "blk.24.ffn_gate_exps.weight": "IQ2_S", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "Q6_K", "blk.24.ffn_up_exps.weight": "IQ2_S", "blk.24.ffn_up_shexp.weight": "Q6_K", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "F32", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "Q6_K", "blk.25.attn_gate.weight": "Q6_K", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q6_K", "blk.25.ffn_down_exps.weight": "IQ3_S", "blk.25.ffn_down_shexp.weight": "Q6_K", "blk.25.ffn_gate_exps.weight": "IQ2_S", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "Q6_K", "blk.25.ffn_up_exps.weight": "IQ2_S", "blk.25.ffn_up_shexp.weight": "Q6_K", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "F32", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "Q6_K", "blk.26.attn_gate.weight": "Q6_K", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q6_K", "blk.26.ffn_down_exps.weight": "IQ3_S", "blk.26.ffn_down_shexp.weight": "Q6_K", "blk.26.ffn_gate_exps.weight": "IQ2_S", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "Q6_K", "blk.26.ffn_up_exps.weight": "IQ2_S", "blk.26.ffn_up_shexp.weight": "Q6_K", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "F32", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "Q6_K", "blk.27.attn_k.weight": "Q6_K", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "Q6_K", "blk.27.attn_q.weight": "Q6_K", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q6_K", "blk.27.ffn_down_exps.weight": "IQ3_S", "blk.27.ffn_down_shexp.weight": "Q6_K", "blk.27.ffn_gate_exps.weight": "IQ2_S", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "Q6_K", "blk.27.ffn_up_exps.weight": "IQ2_S", "blk.27.ffn_up_shexp.weight": "Q6_K", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "Q6_K", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q6_K", "blk.28.ffn_down_exps.weight": "IQ3_S", "blk.28.ffn_down_shexp.weight": "Q6_K", "blk.28.ffn_gate_exps.weight": "IQ2_S", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "Q6_K", "blk.28.ffn_up_exps.weight": "IQ2_S", "blk.28.ffn_up_shexp.weight": "Q6_K", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "F32", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "Q6_K", "blk.29.attn_gate.weight": "Q6_K", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q6_K", "blk.29.ffn_down_exps.weight": "IQ3_S", "blk.29.ffn_down_shexp.weight": "Q6_K", "blk.29.ffn_gate_exps.weight": "IQ2_S", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "Q6_K", "blk.29.ffn_up_exps.weight": "IQ2_S", "blk.29.ffn_up_shexp.weight": "Q6_K", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "F32", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "Q6_K", "blk.3.attn_k.weight": "Q6_K", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "Q6_K", "blk.3.attn_q.weight": "Q6_K", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q6_K", "blk.3.ffn_down_exps.weight": "IQ3_S", "blk.3.ffn_down_shexp.weight": "Q6_K", "blk.3.ffn_gate_exps.weight": "IQ2_S", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "Q6_K", "blk.3.ffn_up_exps.weight": "IQ2_S", "blk.3.ffn_up_shexp.weight": "Q6_K", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "Q6_K", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q6_K", "blk.30.ffn_down_exps.weight": "IQ3_S", "blk.30.ffn_down_shexp.weight": "Q6_K", "blk.30.ffn_gate_exps.weight": "IQ2_S", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "Q6_K", "blk.30.ffn_up_exps.weight": "IQ2_S", "blk.30.ffn_up_shexp.weight": "Q6_K", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "F32", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "Q6_K", "blk.31.attn_k.weight": "Q6_K", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "Q6_K", "blk.31.attn_q.weight": "Q6_K", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q6_K", "blk.31.ffn_down_exps.weight": "IQ3_S", "blk.31.ffn_down_shexp.weight": "Q6_K", "blk.31.ffn_gate_exps.weight": "IQ2_S", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "Q6_K", "blk.31.ffn_up_exps.weight": "IQ2_S", "blk.31.ffn_up_shexp.weight": "Q6_K", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "Q6_K", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q6_K", "blk.32.ffn_down_exps.weight": "IQ3_S", "blk.32.ffn_down_shexp.weight": "Q6_K", "blk.32.ffn_gate_exps.weight": "IQ2_S", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "Q6_K", "blk.32.ffn_up_exps.weight": "IQ2_S", "blk.32.ffn_up_shexp.weight": "Q6_K", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "F32", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "Q6_K", "blk.33.attn_gate.weight": "Q6_K", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q6_K", "blk.33.ffn_down_exps.weight": "IQ3_S", "blk.33.ffn_down_shexp.weight": "Q6_K", "blk.33.ffn_gate_exps.weight": "IQ2_S", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "Q6_K", "blk.33.ffn_up_exps.weight": "IQ2_S", "blk.33.ffn_up_shexp.weight": "Q6_K", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "F32", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "Q6_K", "blk.34.attn_gate.weight": "Q6_K", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q6_K", "blk.34.ffn_down_exps.weight": "IQ4_XS", "blk.34.ffn_down_shexp.weight": "Q6_K", "blk.34.ffn_gate_exps.weight": "IQ2_S", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "Q6_K", "blk.34.ffn_up_exps.weight": "IQ2_S", "blk.34.ffn_up_shexp.weight": "Q6_K", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "F32", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "Q6_K", "blk.35.attn_k.weight": "Q6_K", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "Q6_K", "blk.35.attn_q.weight": "Q6_K", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q6_K", "blk.35.ffn_down_exps.weight": "IQ3_S", "blk.35.ffn_down_shexp.weight": "Q6_K", "blk.35.ffn_gate_exps.weight": "IQ2_S", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "Q6_K", "blk.35.ffn_up_exps.weight": "IQ2_S", "blk.35.ffn_up_shexp.weight": "Q6_K", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "Q6_K", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q6_K", "blk.36.ffn_down_exps.weight": "IQ3_S", "blk.36.ffn_down_shexp.weight": "Q6_K", "blk.36.ffn_gate_exps.weight": "IQ2_S", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "Q6_K", "blk.36.ffn_up_exps.weight": "IQ2_S", "blk.36.ffn_up_shexp.weight": "Q6_K", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "F32", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "Q6_K", "blk.37.attn_gate.weight": "Q6_K", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q6_K", "blk.37.ffn_down_exps.weight": "IQ3_S", "blk.37.ffn_down_shexp.weight": "Q6_K", "blk.37.ffn_gate_exps.weight": "IQ2_S", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "Q6_K", "blk.37.ffn_up_exps.weight": "IQ2_S", "blk.37.ffn_up_shexp.weight": "Q6_K", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "F32", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "Q6_K", "blk.38.attn_gate.weight": "Q6_K", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q6_K", "blk.38.ffn_down_exps.weight": "IQ4_XS", "blk.38.ffn_down_shexp.weight": "Q6_K", "blk.38.ffn_gate_exps.weight": "IQ2_S", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "Q6_K", "blk.38.ffn_up_exps.weight": "IQ2_S", "blk.38.ffn_up_shexp.weight": "Q6_K", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "F32", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "Q6_K", "blk.39.attn_k.weight": "Q6_K", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "Q6_K", "blk.39.attn_q.weight": "Q6_K", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q6_K", "blk.39.ffn_down_exps.weight": "IQ4_XS", "blk.39.ffn_down_shexp.weight": "Q6_K", "blk.39.ffn_gate_exps.weight": "IQ2_S", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "Q6_K", "blk.39.ffn_up_exps.weight": "IQ2_S", "blk.39.ffn_up_shexp.weight": "Q6_K", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "Q6_K", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q6_K", "blk.4.ffn_down_exps.weight": "IQ3_S", "blk.4.ffn_down_shexp.weight": "Q6_K", "blk.4.ffn_gate_exps.weight": "IQ2_S", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "Q6_K", "blk.4.ffn_up_exps.weight": "IQ2_S", "blk.4.ffn_up_shexp.weight": "Q6_K", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "F32", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "Q6_K", "blk.5.attn_gate.weight": "Q6_K", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q6_K", "blk.5.ffn_down_exps.weight": "IQ3_S", "blk.5.ffn_down_shexp.weight": "Q6_K", "blk.5.ffn_gate_exps.weight": "IQ2_S", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "Q6_K", "blk.5.ffn_up_exps.weight": "IQ2_S", "blk.5.ffn_up_shexp.weight": "Q6_K", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "F32", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "Q6_K", "blk.6.attn_gate.weight": "Q6_K", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q6_K", "blk.6.ffn_down_exps.weight": "IQ3_S", "blk.6.ffn_down_shexp.weight": "Q6_K", "blk.6.ffn_gate_exps.weight": "IQ2_S", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "Q6_K", "blk.6.ffn_up_exps.weight": "IQ2_S", "blk.6.ffn_up_shexp.weight": "Q6_K", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "F32", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "Q6_K", "blk.7.attn_k.weight": "Q6_K", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "Q6_K", "blk.7.attn_q.weight": "Q6_K", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q6_K", "blk.7.ffn_down_exps.weight": "IQ3_S", "blk.7.ffn_down_shexp.weight": "Q6_K", "blk.7.ffn_gate_exps.weight": "IQ2_S", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "Q6_K", "blk.7.ffn_up_exps.weight": "IQ2_S", "blk.7.ffn_up_shexp.weight": "Q6_K", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "Q6_K", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q6_K", "blk.8.ffn_down_exps.weight": "IQ3_S", "blk.8.ffn_down_shexp.weight": "Q6_K", "blk.8.ffn_gate_exps.weight": "IQ2_S", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "Q6_K", "blk.8.ffn_up_exps.weight": "IQ2_S", "blk.8.ffn_up_shexp.weight": "Q6_K", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "F32", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "Q6_K", "blk.9.attn_gate.weight": "Q6_K", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q6_K", "blk.9.ffn_down_exps.weight": "IQ3_S", "blk.9.ffn_down_shexp.weight": "Q6_K", "blk.9.ffn_gate_exps.weight": "IQ2_S", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "Q6_K", "blk.9.ffn_up_exps.weight": "IQ2_S", "blk.9.ffn_up_shexp.weight": "Q6_K", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "F32", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "Q6_K", "output.weight": "Q6_K", "output_norm.weight": "F32", "token_embd.weight": "Q6_K" } }, { "FileName": "Qwen3.6-35B-A3B-MQ-IQ2_XXS_1.gguf", "DisplayName": "MQ-IQ2_XXS_1", "ShortName": "MQ-IQ2_XXS_1", "Provider": "MagicQuant", "QuantFamily": "IQ2_XXS", "BaseQuant": "IQ2_XXS", "IsHybrid": true, "UsedImatrix": true, "SourceKld": 0.27513, "SourcePpl": 7.049514, "SourcePplDeltaPercent": 23.958396342535607, "SourceSizeBytes": 9587160480, "SourceSizeGB": 9.58716048, "SourceSizeGiB": 8.928738981485367, "TensorTypes": { "blk.0.attn_gate.weight": "IQ2_XXS", "blk.0.attn_norm.weight": "F32", "blk.0.attn_qkv.weight": "Q5_K", "blk.0.ffn_down_exps.weight": "Q2_K", "blk.0.ffn_down_shexp.weight": "Q2_K", "blk.0.ffn_gate_exps.weight": "IQ2_XXS", "blk.0.ffn_gate_inp.weight": "F32", "blk.0.ffn_gate_inp_shexp.weight": "F32", "blk.0.ffn_gate_shexp.weight": "IQ2_XXS", "blk.0.ffn_up_exps.weight": "IQ2_XXS", "blk.0.ffn_up_shexp.weight": "IQ2_XXS", "blk.0.post_attention_norm.weight": "F32", "blk.0.ssm_a": "F32", "blk.0.ssm_alpha.weight": "F32", "blk.0.ssm_beta.weight": "IQ2_XXS", "blk.0.ssm_conv1d.weight": "F32", "blk.0.ssm_dt.bias": "F32", "blk.0.ssm_norm.weight": "F32", "blk.0.ssm_out.weight": "IQ2_XXS", "blk.1.attn_gate.weight": "IQ2_XXS", "blk.1.attn_norm.weight": "F32", "blk.1.attn_qkv.weight": "Q5_K", "blk.1.ffn_down_exps.weight": "Q2_K", "blk.1.ffn_down_shexp.weight": "Q2_K", "blk.1.ffn_gate_exps.weight": "IQ2_XXS", "blk.1.ffn_gate_inp.weight": "F32", "blk.1.ffn_gate_inp_shexp.weight": "F32", "blk.1.ffn_gate_shexp.weight": "IQ2_XXS", "blk.1.ffn_up_exps.weight": "IQ2_XXS", "blk.1.ffn_up_shexp.weight": "IQ2_XXS", "blk.1.post_attention_norm.weight": "F32", "blk.1.ssm_a": "F32", "blk.1.ssm_alpha.weight": "F32", "blk.1.ssm_beta.weight": "IQ2_XXS", "blk.1.ssm_conv1d.weight": "F32", "blk.1.ssm_dt.bias": "F32", "blk.1.ssm_norm.weight": "F32", "blk.1.ssm_out.weight": "IQ2_XXS", "blk.10.attn_gate.weight": "IQ2_XXS", "blk.10.attn_norm.weight": "F32", "blk.10.attn_qkv.weight": "Q4_K", "blk.10.ffn_down_exps.weight": "IQ2_XXS", "blk.10.ffn_down_shexp.weight": "IQ2_XXS", "blk.10.ffn_gate_exps.weight": "IQ2_XXS", "blk.10.ffn_gate_inp.weight": "F32", "blk.10.ffn_gate_inp_shexp.weight": "F32", "blk.10.ffn_gate_shexp.weight": "IQ2_XXS", "blk.10.ffn_up_exps.weight": "IQ2_XXS", "blk.10.ffn_up_shexp.weight": "IQ2_XXS", "blk.10.post_attention_norm.weight": "F32", "blk.10.ssm_a": "F32", "blk.10.ssm_alpha.weight": "F32", "blk.10.ssm_beta.weight": "IQ2_XXS", "blk.10.ssm_conv1d.weight": "F32", "blk.10.ssm_dt.bias": "F32", "blk.10.ssm_norm.weight": "F32", "blk.10.ssm_out.weight": "IQ2_XXS", "blk.11.attn_k.weight": "IQ3_S", "blk.11.attn_k_norm.weight": "F32", "blk.11.attn_norm.weight": "F32", "blk.11.attn_output.weight": "IQ4_XS", "blk.11.attn_q.weight": "Q4_K", "blk.11.attn_q_norm.weight": "F32", "blk.11.attn_v.weight": "Q4_K", "blk.11.ffn_down_exps.weight": "IQ2_XXS", "blk.11.ffn_down_shexp.weight": "IQ2_XXS", "blk.11.ffn_gate_exps.weight": "IQ2_XXS", "blk.11.ffn_gate_inp.weight": "F32", "blk.11.ffn_gate_inp_shexp.weight": "F32", "blk.11.ffn_gate_shexp.weight": "IQ2_XXS", "blk.11.ffn_up_exps.weight": "IQ2_XXS", "blk.11.ffn_up_shexp.weight": "IQ2_XXS", "blk.11.post_attention_norm.weight": "F32", "blk.12.attn_gate.weight": "IQ2_XXS", "blk.12.attn_norm.weight": "F32", "blk.12.attn_qkv.weight": "Q4_K", "blk.12.ffn_down_exps.weight": "IQ2_XXS", "blk.12.ffn_down_shexp.weight": "IQ2_XXS", "blk.12.ffn_gate_exps.weight": "IQ2_XXS", "blk.12.ffn_gate_inp.weight": "F32", "blk.12.ffn_gate_inp_shexp.weight": "F32", "blk.12.ffn_gate_shexp.weight": "IQ2_XXS", "blk.12.ffn_up_exps.weight": "IQ2_XXS", "blk.12.ffn_up_shexp.weight": "IQ2_XXS", "blk.12.post_attention_norm.weight": "F32", "blk.12.ssm_a": "F32", "blk.12.ssm_alpha.weight": "F32", "blk.12.ssm_beta.weight": "IQ2_XXS", "blk.12.ssm_conv1d.weight": "F32", "blk.12.ssm_dt.bias": "F32", "blk.12.ssm_norm.weight": "F32", "blk.12.ssm_out.weight": "IQ2_XXS", "blk.13.attn_gate.weight": "IQ2_XXS", "blk.13.attn_norm.weight": "F32", "blk.13.attn_qkv.weight": "Q4_K", "blk.13.ffn_down_exps.weight": "IQ2_XXS", "blk.13.ffn_down_shexp.weight": "IQ2_XXS", "blk.13.ffn_gate_exps.weight": "IQ2_XXS", "blk.13.ffn_gate_inp.weight": "F32", "blk.13.ffn_gate_inp_shexp.weight": "F32", "blk.13.ffn_gate_shexp.weight": "IQ2_XXS", "blk.13.ffn_up_exps.weight": "IQ2_XXS", "blk.13.ffn_up_shexp.weight": "IQ2_XXS", "blk.13.post_attention_norm.weight": "F32", "blk.13.ssm_a": "F32", "blk.13.ssm_alpha.weight": "F32", "blk.13.ssm_beta.weight": "IQ2_XXS", "blk.13.ssm_conv1d.weight": "F32", "blk.13.ssm_dt.bias": "F32", "blk.13.ssm_norm.weight": "F32", "blk.13.ssm_out.weight": "IQ2_XXS", "blk.14.attn_gate.weight": "IQ2_XXS", "blk.14.attn_norm.weight": "F32", "blk.14.attn_qkv.weight": "Q4_K", "blk.14.ffn_down_exps.weight": "IQ2_XXS", "blk.14.ffn_down_shexp.weight": "IQ2_XXS", "blk.14.ffn_gate_exps.weight": "IQ2_XXS", "blk.14.ffn_gate_inp.weight": "F32", "blk.14.ffn_gate_inp_shexp.weight": "F32", "blk.14.ffn_gate_shexp.weight": "IQ2_XXS", "blk.14.ffn_up_exps.weight": "IQ2_XXS", "blk.14.ffn_up_shexp.weight": "IQ2_XXS", "blk.14.post_attention_norm.weight": "F32", "blk.14.ssm_a": "F32", "blk.14.ssm_alpha.weight": "F32", "blk.14.ssm_beta.weight": "IQ2_XXS", "blk.14.ssm_conv1d.weight": "F32", "blk.14.ssm_dt.bias": "F32", "blk.14.ssm_norm.weight": "F32", "blk.14.ssm_out.weight": "IQ2_XXS", "blk.15.attn_k.weight": "IQ3_S", "blk.15.attn_k_norm.weight": "F32", "blk.15.attn_norm.weight": "F32", "blk.15.attn_output.weight": "IQ4_XS", "blk.15.attn_q.weight": "Q4_K", "blk.15.attn_q_norm.weight": "F32", "blk.15.attn_v.weight": "Q4_K", "blk.15.ffn_down_exps.weight": "IQ2_XXS", "blk.15.ffn_down_shexp.weight": "IQ2_XXS", "blk.15.ffn_gate_exps.weight": "IQ2_XXS", "blk.15.ffn_gate_inp.weight": "F32", "blk.15.ffn_gate_inp_shexp.weight": "F32", "blk.15.ffn_gate_shexp.weight": "IQ2_XXS", "blk.15.ffn_up_exps.weight": "IQ2_XXS", "blk.15.ffn_up_shexp.weight": "IQ2_XXS", "blk.15.post_attention_norm.weight": "F32", "blk.16.attn_gate.weight": "IQ2_XXS", "blk.16.attn_norm.weight": "F32", "blk.16.attn_qkv.weight": "Q4_K", "blk.16.ffn_down_exps.weight": "IQ2_XXS", "blk.16.ffn_down_shexp.weight": "IQ2_XXS", "blk.16.ffn_gate_exps.weight": "IQ2_XXS", "blk.16.ffn_gate_inp.weight": "F32", "blk.16.ffn_gate_inp_shexp.weight": "F32", "blk.16.ffn_gate_shexp.weight": "IQ2_XXS", "blk.16.ffn_up_exps.weight": "IQ2_XXS", "blk.16.ffn_up_shexp.weight": "IQ2_XXS", "blk.16.post_attention_norm.weight": "F32", "blk.16.ssm_a": "F32", "blk.16.ssm_alpha.weight": "F32", "blk.16.ssm_beta.weight": "IQ2_XXS", "blk.16.ssm_conv1d.weight": "F32", "blk.16.ssm_dt.bias": "F32", "blk.16.ssm_norm.weight": "F32", "blk.16.ssm_out.weight": "IQ2_XXS", "blk.17.attn_gate.weight": "IQ2_XXS", "blk.17.attn_norm.weight": "F32", "blk.17.attn_qkv.weight": "Q4_K", "blk.17.ffn_down_exps.weight": "IQ2_XXS", "blk.17.ffn_down_shexp.weight": "IQ2_XXS", "blk.17.ffn_gate_exps.weight": "IQ2_XXS", "blk.17.ffn_gate_inp.weight": "F32", "blk.17.ffn_gate_inp_shexp.weight": "F32", "blk.17.ffn_gate_shexp.weight": "IQ2_XXS", "blk.17.ffn_up_exps.weight": "IQ2_XXS", "blk.17.ffn_up_shexp.weight": "IQ2_XXS", "blk.17.post_attention_norm.weight": "F32", "blk.17.ssm_a": "F32", "blk.17.ssm_alpha.weight": "F32", "blk.17.ssm_beta.weight": "IQ2_XXS", "blk.17.ssm_conv1d.weight": "F32", "blk.17.ssm_dt.bias": "F32", "blk.17.ssm_norm.weight": "F32", "blk.17.ssm_out.weight": "IQ2_XXS", "blk.18.attn_gate.weight": "IQ2_XXS", "blk.18.attn_norm.weight": "F32", "blk.18.attn_qkv.weight": "Q4_K", "blk.18.ffn_down_exps.weight": "IQ2_XXS", "blk.18.ffn_down_shexp.weight": "IQ2_XXS", "blk.18.ffn_gate_exps.weight": "IQ2_XXS", "blk.18.ffn_gate_inp.weight": "F32", "blk.18.ffn_gate_inp_shexp.weight": "F32", "blk.18.ffn_gate_shexp.weight": "IQ2_XXS", "blk.18.ffn_up_exps.weight": "IQ2_XXS", "blk.18.ffn_up_shexp.weight": "IQ2_XXS", "blk.18.post_attention_norm.weight": "F32", "blk.18.ssm_a": "F32", "blk.18.ssm_alpha.weight": "F32", "blk.18.ssm_beta.weight": "IQ2_XXS", "blk.18.ssm_conv1d.weight": "F32", "blk.18.ssm_dt.bias": "F32", "blk.18.ssm_norm.weight": "F32", "blk.18.ssm_out.weight": "IQ2_XXS", "blk.19.attn_k.weight": "IQ3_S", "blk.19.attn_k_norm.weight": "F32", "blk.19.attn_norm.weight": "F32", "blk.19.attn_output.weight": "IQ4_XS", "blk.19.attn_q.weight": "Q4_K", "blk.19.attn_q_norm.weight": "F32", "blk.19.attn_v.weight": "Q4_K", "blk.19.ffn_down_exps.weight": "IQ2_XXS", "blk.19.ffn_down_shexp.weight": "IQ2_XXS", "blk.19.ffn_gate_exps.weight": "IQ2_XXS", "blk.19.ffn_gate_inp.weight": "F32", "blk.19.ffn_gate_inp_shexp.weight": "F32", "blk.19.ffn_gate_shexp.weight": "IQ2_XXS", "blk.19.ffn_up_exps.weight": "IQ2_XXS", "blk.19.ffn_up_shexp.weight": "IQ2_XXS", "blk.19.post_attention_norm.weight": "F32", "blk.2.attn_gate.weight": "IQ2_XXS", "blk.2.attn_norm.weight": "F32", "blk.2.attn_qkv.weight": "Q5_K", "blk.2.ffn_down_exps.weight": "Q2_K", "blk.2.ffn_down_shexp.weight": "IQ2_XXS", "blk.2.ffn_gate_exps.weight": "IQ2_XXS", "blk.2.ffn_gate_inp.weight": "F32", "blk.2.ffn_gate_inp_shexp.weight": "F32", "blk.2.ffn_gate_shexp.weight": "IQ2_XXS", "blk.2.ffn_up_exps.weight": "IQ2_XXS", "blk.2.ffn_up_shexp.weight": "IQ2_XXS", "blk.2.post_attention_norm.weight": "F32", "blk.2.ssm_a": "F32", "blk.2.ssm_alpha.weight": "F32", "blk.2.ssm_beta.weight": "IQ2_XXS", "blk.2.ssm_conv1d.weight": "F32", "blk.2.ssm_dt.bias": "F32", "blk.2.ssm_norm.weight": "F32", "blk.2.ssm_out.weight": "IQ2_XXS", "blk.20.attn_gate.weight": "IQ2_XXS", "blk.20.attn_norm.weight": "F32", "blk.20.attn_qkv.weight": "Q4_K", "blk.20.ffn_down_exps.weight": "IQ2_XXS", "blk.20.ffn_down_shexp.weight": "IQ2_XXS", "blk.20.ffn_gate_exps.weight": "IQ2_XXS", "blk.20.ffn_gate_inp.weight": "F32", "blk.20.ffn_gate_inp_shexp.weight": "F32", "blk.20.ffn_gate_shexp.weight": "IQ2_XXS", "blk.20.ffn_up_exps.weight": "IQ2_XXS", "blk.20.ffn_up_shexp.weight": "IQ2_XXS", "blk.20.post_attention_norm.weight": "F32", "blk.20.ssm_a": "F32", "blk.20.ssm_alpha.weight": "F32", "blk.20.ssm_beta.weight": "IQ2_XXS", "blk.20.ssm_conv1d.weight": "F32", "blk.20.ssm_dt.bias": "F32", "blk.20.ssm_norm.weight": "F32", "blk.20.ssm_out.weight": "IQ2_XXS", "blk.21.attn_gate.weight": "IQ2_XXS", "blk.21.attn_norm.weight": "F32", "blk.21.attn_qkv.weight": "Q4_K", "blk.21.ffn_down_exps.weight": "IQ2_XXS", "blk.21.ffn_down_shexp.weight": "IQ2_XXS", "blk.21.ffn_gate_exps.weight": "IQ2_XXS", "blk.21.ffn_gate_inp.weight": "F32", "blk.21.ffn_gate_inp_shexp.weight": "F32", "blk.21.ffn_gate_shexp.weight": "IQ2_XXS", "blk.21.ffn_up_exps.weight": "IQ2_XXS", "blk.21.ffn_up_shexp.weight": "IQ2_XXS", "blk.21.post_attention_norm.weight": "F32", "blk.21.ssm_a": "F32", "blk.21.ssm_alpha.weight": "F32", "blk.21.ssm_beta.weight": "IQ2_XXS", "blk.21.ssm_conv1d.weight": "F32", "blk.21.ssm_dt.bias": "F32", "blk.21.ssm_norm.weight": "F32", "blk.21.ssm_out.weight": "IQ2_XXS", "blk.22.attn_gate.weight": "IQ2_XXS", "blk.22.attn_norm.weight": "F32", "blk.22.attn_qkv.weight": "Q4_K", "blk.22.ffn_down_exps.weight": "IQ2_XXS", "blk.22.ffn_down_shexp.weight": "IQ2_XXS", "blk.22.ffn_gate_exps.weight": "IQ2_XXS", "blk.22.ffn_gate_inp.weight": "F32", "blk.22.ffn_gate_inp_shexp.weight": "F32", "blk.22.ffn_gate_shexp.weight": "IQ2_XXS", "blk.22.ffn_up_exps.weight": "IQ2_XXS", "blk.22.ffn_up_shexp.weight": "IQ2_XXS", "blk.22.post_attention_norm.weight": "F32", "blk.22.ssm_a": "F32", "blk.22.ssm_alpha.weight": "F32", "blk.22.ssm_beta.weight": "IQ2_XXS", "blk.22.ssm_conv1d.weight": "F32", "blk.22.ssm_dt.bias": "F32", "blk.22.ssm_norm.weight": "F32", "blk.22.ssm_out.weight": "IQ2_XXS", "blk.23.attn_k.weight": "IQ3_S", "blk.23.attn_k_norm.weight": "F32", "blk.23.attn_norm.weight": "F32", "blk.23.attn_output.weight": "IQ4_XS", "blk.23.attn_q.weight": "Q4_K", "blk.23.attn_q_norm.weight": "F32", "blk.23.attn_v.weight": "Q4_K", "blk.23.ffn_down_exps.weight": "IQ2_XXS", "blk.23.ffn_down_shexp.weight": "IQ2_XXS", "blk.23.ffn_gate_exps.weight": "IQ2_XXS", "blk.23.ffn_gate_inp.weight": "F32", "blk.23.ffn_gate_inp_shexp.weight": "F32", "blk.23.ffn_gate_shexp.weight": "IQ2_XXS", "blk.23.ffn_up_exps.weight": "IQ2_XXS", "blk.23.ffn_up_shexp.weight": "IQ2_XXS", "blk.23.post_attention_norm.weight": "F32", "blk.24.attn_gate.weight": "IQ2_XXS", "blk.24.attn_norm.weight": "F32", "blk.24.attn_qkv.weight": "Q4_K", "blk.24.ffn_down_exps.weight": "IQ2_XXS", "blk.24.ffn_down_shexp.weight": "IQ2_XXS", "blk.24.ffn_gate_exps.weight": "IQ2_XXS", "blk.24.ffn_gate_inp.weight": "F32", "blk.24.ffn_gate_inp_shexp.weight": "F32", "blk.24.ffn_gate_shexp.weight": "IQ2_XXS", "blk.24.ffn_up_exps.weight": "IQ2_XXS", "blk.24.ffn_up_shexp.weight": "IQ2_XXS", "blk.24.post_attention_norm.weight": "F32", "blk.24.ssm_a": "F32", "blk.24.ssm_alpha.weight": "F32", "blk.24.ssm_beta.weight": "IQ2_XXS", "blk.24.ssm_conv1d.weight": "F32", "blk.24.ssm_dt.bias": "F32", "blk.24.ssm_norm.weight": "F32", "blk.24.ssm_out.weight": "IQ2_XXS", "blk.25.attn_gate.weight": "IQ2_XXS", "blk.25.attn_norm.weight": "F32", "blk.25.attn_qkv.weight": "Q4_K", "blk.25.ffn_down_exps.weight": "IQ2_XXS", "blk.25.ffn_down_shexp.weight": "IQ2_XXS", "blk.25.ffn_gate_exps.weight": "IQ2_XXS", "blk.25.ffn_gate_inp.weight": "F32", "blk.25.ffn_gate_inp_shexp.weight": "F32", "blk.25.ffn_gate_shexp.weight": "IQ2_XXS", "blk.25.ffn_up_exps.weight": "IQ2_XXS", "blk.25.ffn_up_shexp.weight": "IQ2_XXS", "blk.25.post_attention_norm.weight": "F32", "blk.25.ssm_a": "F32", "blk.25.ssm_alpha.weight": "F32", "blk.25.ssm_beta.weight": "IQ2_XXS", "blk.25.ssm_conv1d.weight": "F32", "blk.25.ssm_dt.bias": "F32", "blk.25.ssm_norm.weight": "F32", "blk.25.ssm_out.weight": "IQ2_XXS", "blk.26.attn_gate.weight": "IQ2_XXS", "blk.26.attn_norm.weight": "F32", "blk.26.attn_qkv.weight": "Q4_K", "blk.26.ffn_down_exps.weight": "IQ2_XXS", "blk.26.ffn_down_shexp.weight": "IQ2_XXS", "blk.26.ffn_gate_exps.weight": "IQ2_XXS", "blk.26.ffn_gate_inp.weight": "F32", "blk.26.ffn_gate_inp_shexp.weight": "F32", "blk.26.ffn_gate_shexp.weight": "IQ2_XXS", "blk.26.ffn_up_exps.weight": "IQ2_XXS", "blk.26.ffn_up_shexp.weight": "IQ2_XXS", "blk.26.post_attention_norm.weight": "F32", "blk.26.ssm_a": "F32", "blk.26.ssm_alpha.weight": "F32", "blk.26.ssm_beta.weight": "IQ2_XXS", "blk.26.ssm_conv1d.weight": "F32", "blk.26.ssm_dt.bias": "F32", "blk.26.ssm_norm.weight": "F32", "blk.26.ssm_out.weight": "IQ2_XXS", "blk.27.attn_k.weight": "IQ3_S", "blk.27.attn_k_norm.weight": "F32", "blk.27.attn_norm.weight": "F32", "blk.27.attn_output.weight": "IQ4_XS", "blk.27.attn_q.weight": "Q4_K", "blk.27.attn_q_norm.weight": "F32", "blk.27.attn_v.weight": "Q4_K", "blk.27.ffn_down_exps.weight": "IQ2_XXS", "blk.27.ffn_down_shexp.weight": "IQ2_XXS", "blk.27.ffn_gate_exps.weight": "IQ2_XXS", "blk.27.ffn_gate_inp.weight": "F32", "blk.27.ffn_gate_inp_shexp.weight": "F32", "blk.27.ffn_gate_shexp.weight": "IQ2_XXS", "blk.27.ffn_up_exps.weight": "IQ2_XXS", "blk.27.ffn_up_shexp.weight": "IQ2_XXS", "blk.27.post_attention_norm.weight": "F32", "blk.28.attn_gate.weight": "IQ2_XXS", "blk.28.attn_norm.weight": "F32", "blk.28.attn_qkv.weight": "Q4_K", "blk.28.ffn_down_exps.weight": "IQ2_XXS", "blk.28.ffn_down_shexp.weight": "IQ2_XXS", "blk.28.ffn_gate_exps.weight": "IQ2_XXS", "blk.28.ffn_gate_inp.weight": "F32", "blk.28.ffn_gate_inp_shexp.weight": "F32", "blk.28.ffn_gate_shexp.weight": "IQ2_XXS", "blk.28.ffn_up_exps.weight": "IQ2_XXS", "blk.28.ffn_up_shexp.weight": "IQ2_XXS", "blk.28.post_attention_norm.weight": "F32", "blk.28.ssm_a": "F32", "blk.28.ssm_alpha.weight": "F32", "blk.28.ssm_beta.weight": "IQ2_XXS", "blk.28.ssm_conv1d.weight": "F32", "blk.28.ssm_dt.bias": "F32", "blk.28.ssm_norm.weight": "F32", "blk.28.ssm_out.weight": "IQ2_XXS", "blk.29.attn_gate.weight": "IQ2_XXS", "blk.29.attn_norm.weight": "F32", "blk.29.attn_qkv.weight": "Q4_K", "blk.29.ffn_down_exps.weight": "IQ2_XXS", "blk.29.ffn_down_shexp.weight": "IQ2_XXS", "blk.29.ffn_gate_exps.weight": "IQ2_XXS", "blk.29.ffn_gate_inp.weight": "F32", "blk.29.ffn_gate_inp_shexp.weight": "F32", "blk.29.ffn_gate_shexp.weight": "IQ2_XXS", "blk.29.ffn_up_exps.weight": "IQ2_XXS", "blk.29.ffn_up_shexp.weight": "IQ2_XXS", "blk.29.post_attention_norm.weight": "F32", "blk.29.ssm_a": "F32", "blk.29.ssm_alpha.weight": "F32", "blk.29.ssm_beta.weight": "IQ2_XXS", "blk.29.ssm_conv1d.weight": "F32", "blk.29.ssm_dt.bias": "F32", "blk.29.ssm_norm.weight": "F32", "blk.29.ssm_out.weight": "IQ2_XXS", "blk.3.attn_k.weight": "IQ3_S", "blk.3.attn_k_norm.weight": "F32", "blk.3.attn_norm.weight": "F32", "blk.3.attn_output.weight": "IQ4_XS", "blk.3.attn_q.weight": "Q4_K", "blk.3.attn_q_norm.weight": "F32", "blk.3.attn_v.weight": "Q4_K", "blk.3.ffn_down_exps.weight": "IQ2_XXS", "blk.3.ffn_down_shexp.weight": "IQ2_XXS", "blk.3.ffn_gate_exps.weight": "IQ2_XXS", "blk.3.ffn_gate_inp.weight": "F32", "blk.3.ffn_gate_inp_shexp.weight": "F32", "blk.3.ffn_gate_shexp.weight": "IQ2_XXS", "blk.3.ffn_up_exps.weight": "IQ2_XXS", "blk.3.ffn_up_shexp.weight": "IQ2_XXS", "blk.3.post_attention_norm.weight": "F32", "blk.30.attn_gate.weight": "IQ2_XXS", "blk.30.attn_norm.weight": "F32", "blk.30.attn_qkv.weight": "Q4_K", "blk.30.ffn_down_exps.weight": "IQ2_XXS", "blk.30.ffn_down_shexp.weight": "IQ2_XXS", "blk.30.ffn_gate_exps.weight": "IQ2_XXS", "blk.30.ffn_gate_inp.weight": "F32", "blk.30.ffn_gate_inp_shexp.weight": "F32", "blk.30.ffn_gate_shexp.weight": "IQ2_XXS", "blk.30.ffn_up_exps.weight": "IQ2_XXS", "blk.30.ffn_up_shexp.weight": "IQ2_XXS", "blk.30.post_attention_norm.weight": "F32", "blk.30.ssm_a": "F32", "blk.30.ssm_alpha.weight": "F32", "blk.30.ssm_beta.weight": "IQ2_XXS", "blk.30.ssm_conv1d.weight": "F32", "blk.30.ssm_dt.bias": "F32", "blk.30.ssm_norm.weight": "F32", "blk.30.ssm_out.weight": "IQ2_XXS", "blk.31.attn_k.weight": "IQ3_S", "blk.31.attn_k_norm.weight": "F32", "blk.31.attn_norm.weight": "F32", "blk.31.attn_output.weight": "IQ4_XS", "blk.31.attn_q.weight": "Q4_K", "blk.31.attn_q_norm.weight": "F32", "blk.31.attn_v.weight": "Q4_K", "blk.31.ffn_down_exps.weight": "IQ2_XXS", "blk.31.ffn_down_shexp.weight": "IQ2_XXS", "blk.31.ffn_gate_exps.weight": "IQ2_XXS", "blk.31.ffn_gate_inp.weight": "F32", "blk.31.ffn_gate_inp_shexp.weight": "F32", "blk.31.ffn_gate_shexp.weight": "IQ2_XXS", "blk.31.ffn_up_exps.weight": "IQ2_XXS", "blk.31.ffn_up_shexp.weight": "IQ2_XXS", "blk.31.post_attention_norm.weight": "F32", "blk.32.attn_gate.weight": "IQ2_XXS", "blk.32.attn_norm.weight": "F32", "blk.32.attn_qkv.weight": "Q4_K", "blk.32.ffn_down_exps.weight": "IQ2_XXS", "blk.32.ffn_down_shexp.weight": "IQ2_XXS", "blk.32.ffn_gate_exps.weight": "IQ2_XXS", "blk.32.ffn_gate_inp.weight": "F32", "blk.32.ffn_gate_inp_shexp.weight": "F32", "blk.32.ffn_gate_shexp.weight": "IQ2_XXS", "blk.32.ffn_up_exps.weight": "IQ2_XXS", "blk.32.ffn_up_shexp.weight": "IQ2_XXS", "blk.32.post_attention_norm.weight": "F32", "blk.32.ssm_a": "F32", "blk.32.ssm_alpha.weight": "F32", "blk.32.ssm_beta.weight": "IQ2_XXS", "blk.32.ssm_conv1d.weight": "F32", "blk.32.ssm_dt.bias": "F32", "blk.32.ssm_norm.weight": "F32", "blk.32.ssm_out.weight": "IQ2_XXS", "blk.33.attn_gate.weight": "IQ2_XXS", "blk.33.attn_norm.weight": "F32", "blk.33.attn_qkv.weight": "Q4_K", "blk.33.ffn_down_exps.weight": "IQ2_XXS", "blk.33.ffn_down_shexp.weight": "IQ2_XXS", "blk.33.ffn_gate_exps.weight": "IQ2_XXS", "blk.33.ffn_gate_inp.weight": "F32", "blk.33.ffn_gate_inp_shexp.weight": "F32", "blk.33.ffn_gate_shexp.weight": "IQ2_XXS", "blk.33.ffn_up_exps.weight": "IQ2_XXS", "blk.33.ffn_up_shexp.weight": "IQ2_XXS", "blk.33.post_attention_norm.weight": "F32", "blk.33.ssm_a": "F32", "blk.33.ssm_alpha.weight": "F32", "blk.33.ssm_beta.weight": "IQ2_XXS", "blk.33.ssm_conv1d.weight": "F32", "blk.33.ssm_dt.bias": "F32", "blk.33.ssm_norm.weight": "F32", "blk.33.ssm_out.weight": "IQ2_XXS", "blk.34.attn_gate.weight": "IQ2_XXS", "blk.34.attn_norm.weight": "F32", "blk.34.attn_qkv.weight": "Q4_K", "blk.34.ffn_down_exps.weight": "IQ2_XXS", "blk.34.ffn_down_shexp.weight": "IQ2_XXS", "blk.34.ffn_gate_exps.weight": "IQ2_XXS", "blk.34.ffn_gate_inp.weight": "F32", "blk.34.ffn_gate_inp_shexp.weight": "F32", "blk.34.ffn_gate_shexp.weight": "IQ2_XXS", "blk.34.ffn_up_exps.weight": "IQ2_XXS", "blk.34.ffn_up_shexp.weight": "IQ2_XXS", "blk.34.post_attention_norm.weight": "F32", "blk.34.ssm_a": "F32", "blk.34.ssm_alpha.weight": "F32", "blk.34.ssm_beta.weight": "IQ2_XXS", "blk.34.ssm_conv1d.weight": "F32", "blk.34.ssm_dt.bias": "F32", "blk.34.ssm_norm.weight": "F32", "blk.34.ssm_out.weight": "IQ2_XXS", "blk.35.attn_k.weight": "IQ3_S", "blk.35.attn_k_norm.weight": "F32", "blk.35.attn_norm.weight": "F32", "blk.35.attn_output.weight": "IQ4_XS", "blk.35.attn_q.weight": "Q4_K", "blk.35.attn_q_norm.weight": "F32", "blk.35.attn_v.weight": "Q4_K", "blk.35.ffn_down_exps.weight": "IQ2_XXS", "blk.35.ffn_down_shexp.weight": "IQ2_XXS", "blk.35.ffn_gate_exps.weight": "IQ2_XXS", "blk.35.ffn_gate_inp.weight": "F32", "blk.35.ffn_gate_inp_shexp.weight": "F32", "blk.35.ffn_gate_shexp.weight": "IQ2_XXS", "blk.35.ffn_up_exps.weight": "IQ2_XXS", "blk.35.ffn_up_shexp.weight": "IQ2_XXS", "blk.35.post_attention_norm.weight": "F32", "blk.36.attn_gate.weight": "IQ2_XXS", "blk.36.attn_norm.weight": "F32", "blk.36.attn_qkv.weight": "Q4_K", "blk.36.ffn_down_exps.weight": "IQ2_XXS", "blk.36.ffn_down_shexp.weight": "IQ2_XXS", "blk.36.ffn_gate_exps.weight": "IQ2_XXS", "blk.36.ffn_gate_inp.weight": "F32", "blk.36.ffn_gate_inp_shexp.weight": "F32", "blk.36.ffn_gate_shexp.weight": "IQ2_XXS", "blk.36.ffn_up_exps.weight": "IQ2_XXS", "blk.36.ffn_up_shexp.weight": "IQ2_XXS", "blk.36.post_attention_norm.weight": "F32", "blk.36.ssm_a": "F32", "blk.36.ssm_alpha.weight": "F32", "blk.36.ssm_beta.weight": "IQ2_XXS", "blk.36.ssm_conv1d.weight": "F32", "blk.36.ssm_dt.bias": "F32", "blk.36.ssm_norm.weight": "F32", "blk.36.ssm_out.weight": "IQ2_XXS", "blk.37.attn_gate.weight": "IQ2_XXS", "blk.37.attn_norm.weight": "F32", "blk.37.attn_qkv.weight": "Q4_K", "blk.37.ffn_down_exps.weight": "IQ2_XXS", "blk.37.ffn_down_shexp.weight": "IQ2_XXS", "blk.37.ffn_gate_exps.weight": "IQ2_XXS", "blk.37.ffn_gate_inp.weight": "F32", "blk.37.ffn_gate_inp_shexp.weight": "F32", "blk.37.ffn_gate_shexp.weight": "IQ2_XXS", "blk.37.ffn_up_exps.weight": "IQ2_XXS", "blk.37.ffn_up_shexp.weight": "IQ2_XXS", "blk.37.post_attention_norm.weight": "F32", "blk.37.ssm_a": "F32", "blk.37.ssm_alpha.weight": "F32", "blk.37.ssm_beta.weight": "IQ2_XXS", "blk.37.ssm_conv1d.weight": "F32", "blk.37.ssm_dt.bias": "F32", "blk.37.ssm_norm.weight": "F32", "blk.37.ssm_out.weight": "IQ2_XXS", "blk.38.attn_gate.weight": "IQ2_XXS", "blk.38.attn_norm.weight": "F32", "blk.38.attn_qkv.weight": "Q4_K", "blk.38.ffn_down_exps.weight": "IQ2_XXS", "blk.38.ffn_down_shexp.weight": "IQ2_XXS", "blk.38.ffn_gate_exps.weight": "IQ2_XXS", "blk.38.ffn_gate_inp.weight": "F32", "blk.38.ffn_gate_inp_shexp.weight": "F32", "blk.38.ffn_gate_shexp.weight": "IQ2_XXS", "blk.38.ffn_up_exps.weight": "IQ2_XXS", "blk.38.ffn_up_shexp.weight": "IQ2_XXS", "blk.38.post_attention_norm.weight": "F32", "blk.38.ssm_a": "F32", "blk.38.ssm_alpha.weight": "F32", "blk.38.ssm_beta.weight": "IQ2_XXS", "blk.38.ssm_conv1d.weight": "F32", "blk.38.ssm_dt.bias": "F32", "blk.38.ssm_norm.weight": "F32", "blk.38.ssm_out.weight": "IQ2_XXS", "blk.39.attn_k.weight": "IQ3_S", "blk.39.attn_k_norm.weight": "F32", "blk.39.attn_norm.weight": "F32", "blk.39.attn_output.weight": "IQ4_XS", "blk.39.attn_q.weight": "Q4_K", "blk.39.attn_q_norm.weight": "F32", "blk.39.attn_v.weight": "Q4_K", "blk.39.ffn_down_exps.weight": "IQ2_XXS", "blk.39.ffn_down_shexp.weight": "IQ2_XXS", "blk.39.ffn_gate_exps.weight": "IQ2_XXS", "blk.39.ffn_gate_inp.weight": "F32", "blk.39.ffn_gate_inp_shexp.weight": "F32", "blk.39.ffn_gate_shexp.weight": "IQ2_XXS", "blk.39.ffn_up_exps.weight": "IQ2_XXS", "blk.39.ffn_up_shexp.weight": "IQ2_XXS", "blk.39.post_attention_norm.weight": "F32", "blk.4.attn_gate.weight": "IQ2_XXS", "blk.4.attn_norm.weight": "F32", "blk.4.attn_qkv.weight": "Q4_K", "blk.4.ffn_down_exps.weight": "IQ2_XXS", "blk.4.ffn_down_shexp.weight": "IQ2_XXS", "blk.4.ffn_gate_exps.weight": "IQ2_XXS", "blk.4.ffn_gate_inp.weight": "F32", "blk.4.ffn_gate_inp_shexp.weight": "F32", "blk.4.ffn_gate_shexp.weight": "IQ2_XXS", "blk.4.ffn_up_exps.weight": "IQ2_XXS", "blk.4.ffn_up_shexp.weight": "IQ2_XXS", "blk.4.post_attention_norm.weight": "F32", "blk.4.ssm_a": "F32", "blk.4.ssm_alpha.weight": "F32", "blk.4.ssm_beta.weight": "IQ2_XXS", "blk.4.ssm_conv1d.weight": "F32", "blk.4.ssm_dt.bias": "F32", "blk.4.ssm_norm.weight": "F32", "blk.4.ssm_out.weight": "IQ2_XXS", "blk.5.attn_gate.weight": "IQ2_XXS", "blk.5.attn_norm.weight": "F32", "blk.5.attn_qkv.weight": "Q4_K", "blk.5.ffn_down_exps.weight": "IQ2_XXS", "blk.5.ffn_down_shexp.weight": "IQ2_XXS", "blk.5.ffn_gate_exps.weight": "IQ2_XXS", "blk.5.ffn_gate_inp.weight": "F32", "blk.5.ffn_gate_inp_shexp.weight": "F32", "blk.5.ffn_gate_shexp.weight": "IQ2_XXS", "blk.5.ffn_up_exps.weight": "IQ2_XXS", "blk.5.ffn_up_shexp.weight": "IQ2_XXS", "blk.5.post_attention_norm.weight": "F32", "blk.5.ssm_a": "F32", "blk.5.ssm_alpha.weight": "F32", "blk.5.ssm_beta.weight": "IQ2_XXS", "blk.5.ssm_conv1d.weight": "F32", "blk.5.ssm_dt.bias": "F32", "blk.5.ssm_norm.weight": "F32", "blk.5.ssm_out.weight": "IQ2_XXS", "blk.6.attn_gate.weight": "IQ2_XXS", "blk.6.attn_norm.weight": "F32", "blk.6.attn_qkv.weight": "Q4_K", "blk.6.ffn_down_exps.weight": "IQ2_XXS", "blk.6.ffn_down_shexp.weight": "IQ2_XXS", "blk.6.ffn_gate_exps.weight": "IQ2_XXS", "blk.6.ffn_gate_inp.weight": "F32", "blk.6.ffn_gate_inp_shexp.weight": "F32", "blk.6.ffn_gate_shexp.weight": "IQ2_XXS", "blk.6.ffn_up_exps.weight": "IQ2_XXS", "blk.6.ffn_up_shexp.weight": "IQ2_XXS", "blk.6.post_attention_norm.weight": "F32", "blk.6.ssm_a": "F32", "blk.6.ssm_alpha.weight": "F32", "blk.6.ssm_beta.weight": "IQ2_XXS", "blk.6.ssm_conv1d.weight": "F32", "blk.6.ssm_dt.bias": "F32", "blk.6.ssm_norm.weight": "F32", "blk.6.ssm_out.weight": "IQ2_XXS", "blk.7.attn_k.weight": "IQ3_S", "blk.7.attn_k_norm.weight": "F32", "blk.7.attn_norm.weight": "F32", "blk.7.attn_output.weight": "IQ4_XS", "blk.7.attn_q.weight": "Q4_K", "blk.7.attn_q_norm.weight": "F32", "blk.7.attn_v.weight": "Q4_K", "blk.7.ffn_down_exps.weight": "IQ2_XXS", "blk.7.ffn_down_shexp.weight": "IQ2_XXS", "blk.7.ffn_gate_exps.weight": "IQ2_XXS", "blk.7.ffn_gate_inp.weight": "F32", "blk.7.ffn_gate_inp_shexp.weight": "F32", "blk.7.ffn_gate_shexp.weight": "IQ2_XXS", "blk.7.ffn_up_exps.weight": "IQ2_XXS", "blk.7.ffn_up_shexp.weight": "IQ2_XXS", "blk.7.post_attention_norm.weight": "F32", "blk.8.attn_gate.weight": "IQ2_XXS", "blk.8.attn_norm.weight": "F32", "blk.8.attn_qkv.weight": "Q4_K", "blk.8.ffn_down_exps.weight": "IQ2_XXS", "blk.8.ffn_down_shexp.weight": "IQ2_XXS", "blk.8.ffn_gate_exps.weight": "IQ2_XXS", "blk.8.ffn_gate_inp.weight": "F32", "blk.8.ffn_gate_inp_shexp.weight": "F32", "blk.8.ffn_gate_shexp.weight": "IQ2_XXS", "blk.8.ffn_up_exps.weight": "IQ2_XXS", "blk.8.ffn_up_shexp.weight": "IQ2_XXS", "blk.8.post_attention_norm.weight": "F32", "blk.8.ssm_a": "F32", "blk.8.ssm_alpha.weight": "F32", "blk.8.ssm_beta.weight": "IQ2_XXS", "blk.8.ssm_conv1d.weight": "F32", "blk.8.ssm_dt.bias": "F32", "blk.8.ssm_norm.weight": "F32", "blk.8.ssm_out.weight": "IQ2_XXS", "blk.9.attn_gate.weight": "IQ2_XXS", "blk.9.attn_norm.weight": "F32", "blk.9.attn_qkv.weight": "Q4_K", "blk.9.ffn_down_exps.weight": "IQ2_XXS", "blk.9.ffn_down_shexp.weight": "IQ2_XXS", "blk.9.ffn_gate_exps.weight": "IQ2_XXS", "blk.9.ffn_gate_inp.weight": "F32", "blk.9.ffn_gate_inp_shexp.weight": "F32", "blk.9.ffn_gate_shexp.weight": "IQ2_XXS", "blk.9.ffn_up_exps.weight": "IQ2_XXS", "blk.9.ffn_up_shexp.weight": "IQ2_XXS", "blk.9.post_attention_norm.weight": "F32", "blk.9.ssm_a": "F32", "blk.9.ssm_alpha.weight": "F32", "blk.9.ssm_beta.weight": "IQ2_XXS", "blk.9.ssm_conv1d.weight": "F32", "blk.9.ssm_dt.bias": "F32", "blk.9.ssm_norm.weight": "F32", "blk.9.ssm_out.weight": "IQ2_XXS", "output.weight": "Q5_K", "output_norm.weight": "F32", "token_embd.weight": "Q2_K" } } ] }