Models
Docs
Pricing
Sign in
Download
Models
Download
Docs
Pricing
Sign in
free02
/
glm5.1
:part4
149
Downloads
Updated
1 month ago
Cancel
glm5.1:part4
...
/
model
39cc900489af · 50GB
Metadata
split.count
6
6
split.no
3
3
split.tensors.count
1809
1809
Tensor
Name
Type
Shape
blk.34
blk.34.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.34.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.34.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.34.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.34.indexer.k_norm.bias
F32
F32
[128]
blk.34.indexer.k_norm.weight
F32
F32
[128]
blk.34.indexer.proj.weight
F32
F32
[6144, 32]
blk.35
blk.35.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.35.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.35.attn_kv_a_norm.weight
F32
F32
[512]
blk.35.attn_norm.weight
F32
F32
[6144]
blk.35.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.35.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.35.attn_q_a_norm.weight
F32
F32
[2048]
blk.35.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.35.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.35.exp_probs_b.bias
F32
F32
[256]
blk.35.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.35.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.35.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.35.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.35.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.35.ffn_norm.weight
F32
F32
[6144]
blk.35.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.35.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.35.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.35.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.35.indexer.k_norm.bias
F32
F32
[128]
blk.35.indexer.k_norm.weight
F32
F32
[128]
blk.35.indexer.proj.weight
F32
F32
[6144, 32]
blk.36
blk.36.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.36.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.36.attn_kv_a_norm.weight
F32
F32
[512]
blk.36.attn_norm.weight
F32
F32
[6144]
blk.36.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.36.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.36.attn_q_a_norm.weight
F32
F32
[2048]
blk.36.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.36.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.36.exp_probs_b.bias
F32
F32
[256]
blk.36.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.36.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.36.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.36.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.36.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.36.ffn_norm.weight
F32
F32
[6144]
blk.36.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.36.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.36.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.36.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.36.indexer.k_norm.bias
F32
F32
[128]
blk.36.indexer.k_norm.weight
F32
F32
[128]
blk.36.indexer.proj.weight
F32
F32
[6144, 32]
blk.37
blk.37.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.37.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.37.attn_kv_a_norm.weight
F32
F32
[512]
blk.37.attn_norm.weight
F32
F32
[6144]
blk.37.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.37.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.37.attn_q_a_norm.weight
F32
F32
[2048]
blk.37.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.37.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.37.exp_probs_b.bias
F32
F32
[256]
blk.37.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.37.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.37.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.37.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.37.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.37.ffn_norm.weight
F32
F32
[6144]
blk.37.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.37.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.37.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.37.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.37.indexer.k_norm.bias
F32
F32
[128]
blk.37.indexer.k_norm.weight
F32
F32
[128]
blk.37.indexer.proj.weight
F32
F32
[6144, 32]
blk.38
blk.38.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.38.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.38.attn_kv_a_norm.weight
F32
F32
[512]
blk.38.attn_norm.weight
F32
F32
[6144]
blk.38.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.38.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.38.attn_q_a_norm.weight
F32
F32
[2048]
blk.38.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.38.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.38.exp_probs_b.bias
F32
F32
[256]
blk.38.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.38.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.38.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.38.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.38.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.38.ffn_norm.weight
F32
F32
[6144]
blk.38.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.38.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.38.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.38.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.38.indexer.k_norm.bias
F32
F32
[128]
blk.38.indexer.k_norm.weight
F32
F32
[128]
blk.38.indexer.proj.weight
F32
F32
[6144, 32]
blk.39
blk.39.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.39.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.39.attn_kv_a_norm.weight
F32
F32
[512]
blk.39.attn_norm.weight
F32
F32
[6144]
blk.39.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.39.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.39.attn_q_a_norm.weight
F32
F32
[2048]
blk.39.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.39.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.39.exp_probs_b.bias
F32
F32
[256]
blk.39.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.39.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.39.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.39.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.39.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.39.ffn_norm.weight
F32
F32
[6144]
blk.39.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.39.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.39.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.39.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.39.indexer.k_norm.bias
F32
F32
[128]
blk.39.indexer.k_norm.weight
F32
F32
[128]
blk.39.indexer.proj.weight
F32
F32
[6144, 32]
blk.40
blk.40.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.40.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.40.attn_kv_a_norm.weight
F32
F32
[512]
blk.40.attn_norm.weight
F32
F32
[6144]
blk.40.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.40.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.40.attn_q_a_norm.weight
F32
F32
[2048]
blk.40.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.40.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.40.exp_probs_b.bias
F32
F32
[256]
blk.40.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.40.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.40.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.40.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.40.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.40.ffn_norm.weight
F32
F32
[6144]
blk.40.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.40.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.40.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.40.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.40.indexer.k_norm.bias
F32
F32
[128]
blk.40.indexer.k_norm.weight
F32
F32
[128]
blk.40.indexer.proj.weight
F32
F32
[6144, 32]
blk.41
blk.41.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.41.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.41.attn_kv_a_norm.weight
F32
F32
[512]
blk.41.attn_norm.weight
F32
F32
[6144]
blk.41.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.41.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.41.attn_q_a_norm.weight
F32
F32
[2048]
blk.41.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.41.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.41.exp_probs_b.bias
F32
F32
[256]
blk.41.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.41.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.41.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.41.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.41.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.41.ffn_norm.weight
F32
F32
[6144]
blk.41.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.41.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.41.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.41.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.41.indexer.k_norm.bias
F32
F32
[128]
blk.41.indexer.k_norm.weight
F32
F32
[128]
blk.41.indexer.proj.weight
F32
F32
[6144, 32]
blk.42
blk.42.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.42.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.42.attn_kv_a_norm.weight
F32
F32
[512]
blk.42.attn_norm.weight
F32
F32
[6144]
blk.42.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.42.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.42.attn_q_a_norm.weight
F32
F32
[2048]
blk.42.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.42.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.42.exp_probs_b.bias
F32
F32
[256]
blk.42.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.42.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.42.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.42.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.42.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.42.ffn_norm.weight
F32
F32
[6144]
blk.42.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.42.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.42.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.42.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.42.indexer.k_norm.bias
F32
F32
[128]
blk.42.indexer.k_norm.weight
F32
F32
[128]
blk.42.indexer.proj.weight
F32
F32
[6144, 32]
blk.43
blk.43.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.43.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.43.attn_kv_a_norm.weight
F32
F32
[512]
blk.43.attn_norm.weight
F32
F32
[6144]
blk.43.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.43.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.43.attn_q_a_norm.weight
F32
F32
[2048]
blk.43.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.43.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.43.exp_probs_b.bias
F32
F32
[256]
blk.43.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.43.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.43.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.43.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.43.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.43.ffn_norm.weight
F32
F32
[6144]
blk.43.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.43.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.43.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.43.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.43.indexer.k_norm.bias
F32
F32
[128]
blk.43.indexer.k_norm.weight
F32
F32
[128]
blk.43.indexer.proj.weight
F32
F32
[6144, 32]
blk.44
blk.44.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.44.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.44.attn_kv_a_norm.weight
F32
F32
[512]
blk.44.attn_norm.weight
F32
F32
[6144]
blk.44.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.44.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.44.attn_q_a_norm.weight
F32
F32
[2048]
blk.44.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.44.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.44.exp_probs_b.bias
F32
F32
[256]
blk.44.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.44.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.44.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.44.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.44.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.44.ffn_norm.weight
F32
F32
[6144]
blk.44.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.44.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.44.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.44.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.44.indexer.k_norm.bias
F32
F32
[128]
blk.44.indexer.k_norm.weight
F32
F32
[128]
blk.44.indexer.proj.weight
F32
F32
[6144, 32]
blk.45
blk.45.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.45.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.45.attn_kv_a_norm.weight
F32
F32
[512]
blk.45.attn_norm.weight
F32
F32
[6144]
blk.45.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.45.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.45.attn_q_a_norm.weight
F32
F32
[2048]
blk.45.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.45.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.45.exp_probs_b.bias
F32
F32
[256]
blk.45.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.45.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.45.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.45.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.45.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.45.ffn_norm.weight
F32
F32
[6144]
blk.45.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.45.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.45.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.45.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.45.indexer.k_norm.bias
F32
F32
[128]
blk.45.indexer.k_norm.weight
F32
F32
[128]
blk.45.indexer.proj.weight
F32
F32
[6144, 32]
blk.46
blk.46.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.46.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.46.attn_kv_a_norm.weight
F32
F32
[512]
blk.46.attn_norm.weight
F32
F32
[6144]
blk.46.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.46.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.46.attn_q_a_norm.weight
F32
F32
[2048]
blk.46.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.46.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.46.exp_probs_b.bias
F32
F32
[256]
blk.46.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.46.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.46.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.46.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.46.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.46.ffn_norm.weight
F32
F32
[6144]
blk.46.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.46.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.46.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.46.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.46.indexer.k_norm.bias
F32
F32
[128]
blk.46.indexer.k_norm.weight
F32
F32
[128]
blk.46.indexer.proj.weight
F32
F32
[6144, 32]
blk.47
blk.47.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.47.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.47.attn_kv_a_norm.weight
F32
F32
[512]
blk.47.attn_norm.weight
F32
F32
[6144]
blk.47.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.47.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.47.attn_q_a_norm.weight
F32
F32
[2048]
blk.47.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.47.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.47.exp_probs_b.bias
F32
F32
[256]
blk.47.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.47.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.47.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.47.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.47.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.47.ffn_norm.weight
F32
F32
[6144]
blk.47.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.47.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.47.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.47.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.47.indexer.k_norm.bias
F32
F32
[128]
blk.47.indexer.k_norm.weight
F32
F32
[128]
blk.47.indexer.proj.weight
F32
F32
[6144, 32]
blk.48
blk.48.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.48.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.48.attn_kv_a_norm.weight
F32
F32
[512]
blk.48.attn_norm.weight
F32
F32
[6144]
blk.48.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.48.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.48.attn_q_a_norm.weight
F32
F32
[2048]
blk.48.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.48.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.48.exp_probs_b.bias
F32
F32
[256]
blk.48.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.48.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.48.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.48.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.48.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.48.ffn_norm.weight
F32
F32
[6144]
blk.48.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.48.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.48.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.48.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.48.indexer.k_norm.bias
F32
F32
[128]
blk.48.indexer.k_norm.weight
F32
F32
[128]
blk.48.indexer.proj.weight
F32
F32
[6144, 32]
blk.49
blk.49.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.49.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.49.attn_kv_a_norm.weight
F32
F32
[512]
blk.49.attn_norm.weight
F32
F32
[6144]
blk.49.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.49.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.49.attn_q_a_norm.weight
F32
F32
[2048]
blk.49.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.49.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.49.exp_probs_b.bias
F32
F32
[256]
blk.49.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.49.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.49.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.49.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.49.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.49.ffn_norm.weight
F32
F32
[6144]
blk.49.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.49.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.49.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.49.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.49.indexer.k_norm.bias
F32
F32
[128]
blk.49.indexer.k_norm.weight
F32
F32
[128]
blk.49.indexer.proj.weight
F32
F32
[6144, 32]
blk.50
blk.50.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]
blk.50.attn_kv_a_mqa.weight
Q8_0
Q8_0
[6144, 576]
blk.50.attn_kv_a_norm.weight
F32
F32
[512]
blk.50.attn_norm.weight
F32
F32
[6144]
blk.50.attn_output.weight
Q5_K
Q5_K
[16384, 6144]
blk.50.attn_q_a.weight
Q5_K
Q5_K
[6144, 2048]
blk.50.attn_q_a_norm.weight
F32
F32
[2048]
blk.50.attn_q_b.weight
Q8_0
Q8_0
[2048, 16384]
blk.50.attn_v_b.weight
Q8_0
Q8_0
[512, 256, 64]
blk.50.exp_probs_b.bias
F32
F32
[256]
blk.50.ffn_down_exps.weight
IQ3_XXS
IQ3_XXS
[2048, 6144, 256]
blk.50.ffn_down_shexp.weight
Q6_K
Q6_K
[2048, 6144]
blk.50.ffn_gate_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.50.ffn_gate_inp.weight
F32
F32
[6144, 256]
blk.50.ffn_gate_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.50.ffn_norm.weight
F32
F32
[6144]
blk.50.ffn_up_exps.weight
IQ2_XXS
IQ2_XXS
[6144, 2048, 256]
blk.50.ffn_up_shexp.weight
Q5_K
Q5_K
[6144, 2048]
blk.50.indexer.attn_k.weight
Q8_0
Q8_0
[6144, 128]
blk.50.indexer.attn_q_b.weight
Q8_0
Q8_0
[2048, 4096]
blk.50.indexer.k_norm.bias
F32
F32
[128]
blk.50.indexer.k_norm.weight
F32
F32
[128]
blk.50.indexer.proj.weight
F32
F32
[6144, 32]
blk.51
blk.51.attn_k_b.weight
Q8_0
Q8_0
[192, 512, 64]