free02/ glm5.1:part6

149 1 month ago

43060415fd85 · 37GB
    Metadata
  • split.count
    6
  • split.no
    5
  • split.tensors.count
    1809
  • Tensor
    blk.67
  • blk.67.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.67.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.67.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.67.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.67.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.67.ffn_norm.weight
    F32
    [6144]
  • blk.67.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.67.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.67.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.67.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.67.indexer.k_norm.bias
    F32
    [128]
  • blk.67.indexer.k_norm.weight
    F32
    [128]
  • blk.67.indexer.proj.weight
    F32
    [6144, 32]
  • blk.68
  • blk.68.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.68.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.68.attn_kv_a_norm.weight
    F32
    [512]
  • blk.68.attn_norm.weight
    F32
    [6144]
  • blk.68.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.68.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.68.attn_q_a_norm.weight
    F32
    [2048]
  • blk.68.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.68.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.68.exp_probs_b.bias
    F32
    [256]
  • blk.68.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.68.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.68.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.68.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.68.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.68.ffn_norm.weight
    F32
    [6144]
  • blk.68.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.68.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.68.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.68.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.68.indexer.k_norm.bias
    F32
    [128]
  • blk.68.indexer.k_norm.weight
    F32
    [128]
  • blk.68.indexer.proj.weight
    F32
    [6144, 32]
  • blk.69
  • blk.69.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.69.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.69.attn_kv_a_norm.weight
    F32
    [512]
  • blk.69.attn_norm.weight
    F32
    [6144]
  • blk.69.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.69.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.69.attn_q_a_norm.weight
    F32
    [2048]
  • blk.69.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.69.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.69.exp_probs_b.bias
    F32
    [256]
  • blk.69.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.69.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.69.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.69.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.69.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.69.ffn_norm.weight
    F32
    [6144]
  • blk.69.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.69.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.69.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.69.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.69.indexer.k_norm.bias
    F32
    [128]
  • blk.69.indexer.k_norm.weight
    F32
    [128]
  • blk.69.indexer.proj.weight
    F32
    [6144, 32]
  • blk.70
  • blk.70.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.70.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.70.attn_kv_a_norm.weight
    F32
    [512]
  • blk.70.attn_norm.weight
    F32
    [6144]
  • blk.70.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.70.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.70.attn_q_a_norm.weight
    F32
    [2048]
  • blk.70.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.70.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.70.exp_probs_b.bias
    F32
    [256]
  • blk.70.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.70.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.70.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.70.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.70.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.70.ffn_norm.weight
    F32
    [6144]
  • blk.70.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.70.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.70.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.70.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.70.indexer.k_norm.bias
    F32
    [128]
  • blk.70.indexer.k_norm.weight
    F32
    [128]
  • blk.70.indexer.proj.weight
    F32
    [6144, 32]
  • blk.71
  • blk.71.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.71.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.71.attn_kv_a_norm.weight
    F32
    [512]
  • blk.71.attn_norm.weight
    F32
    [6144]
  • blk.71.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.71.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.71.attn_q_a_norm.weight
    F32
    [2048]
  • blk.71.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.71.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.71.exp_probs_b.bias
    F32
    [256]
  • blk.71.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.71.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.71.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.71.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.71.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.71.ffn_norm.weight
    F32
    [6144]
  • blk.71.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.71.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.71.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.71.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.71.indexer.k_norm.bias
    F32
    [128]
  • blk.71.indexer.k_norm.weight
    F32
    [128]
  • blk.71.indexer.proj.weight
    F32
    [6144, 32]
  • blk.72
  • blk.72.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.72.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.72.attn_kv_a_norm.weight
    F32
    [512]
  • blk.72.attn_norm.weight
    F32
    [6144]
  • blk.72.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.72.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.72.attn_q_a_norm.weight
    F32
    [2048]
  • blk.72.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.72.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.72.exp_probs_b.bias
    F32
    [256]
  • blk.72.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.72.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.72.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.72.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.72.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.72.ffn_norm.weight
    F32
    [6144]
  • blk.72.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.72.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.72.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.72.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.72.indexer.k_norm.bias
    F32
    [128]
  • blk.72.indexer.k_norm.weight
    F32
    [128]
  • blk.72.indexer.proj.weight
    F32
    [6144, 32]
  • blk.73
  • blk.73.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.73.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.73.attn_kv_a_norm.weight
    F32
    [512]
  • blk.73.attn_norm.weight
    F32
    [6144]
  • blk.73.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.73.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.73.attn_q_a_norm.weight
    F32
    [2048]
  • blk.73.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.73.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.73.exp_probs_b.bias
    F32
    [256]
  • blk.73.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.73.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.73.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.73.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.73.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.73.ffn_norm.weight
    F32
    [6144]
  • blk.73.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.73.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.73.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.73.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.73.indexer.k_norm.bias
    F32
    [128]
  • blk.73.indexer.k_norm.weight
    F32
    [128]
  • blk.73.indexer.proj.weight
    F32
    [6144, 32]
  • blk.74
  • blk.74.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.74.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.74.attn_kv_a_norm.weight
    F32
    [512]
  • blk.74.attn_norm.weight
    F32
    [6144]
  • blk.74.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.74.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.74.attn_q_a_norm.weight
    F32
    [2048]
  • blk.74.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.74.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.74.exp_probs_b.bias
    F32
    [256]
  • blk.74.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.74.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.74.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.74.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.74.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.74.ffn_norm.weight
    F32
    [6144]
  • blk.74.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.74.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.74.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.74.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.74.indexer.k_norm.bias
    F32
    [128]
  • blk.74.indexer.k_norm.weight
    F32
    [128]
  • blk.74.indexer.proj.weight
    F32
    [6144, 32]
  • blk.75
  • blk.75.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.75.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.75.attn_kv_a_norm.weight
    F32
    [512]
  • blk.75.attn_norm.weight
    F32
    [6144]
  • blk.75.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.75.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.75.attn_q_a_norm.weight
    F32
    [2048]
  • blk.75.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.75.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.75.exp_probs_b.bias
    F32
    [256]
  • blk.75.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.75.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.75.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.75.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.75.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.75.ffn_norm.weight
    F32
    [6144]
  • blk.75.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.75.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.75.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.75.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.75.indexer.k_norm.bias
    F32
    [128]
  • blk.75.indexer.k_norm.weight
    F32
    [128]
  • blk.75.indexer.proj.weight
    F32
    [6144, 32]
  • blk.76
  • blk.76.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.76.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.76.attn_kv_a_norm.weight
    F32
    [512]
  • blk.76.attn_norm.weight
    F32
    [6144]
  • blk.76.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.76.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.76.attn_q_a_norm.weight
    F32
    [2048]
  • blk.76.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.76.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.76.exp_probs_b.bias
    F32
    [256]
  • blk.76.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.76.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.76.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.76.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.76.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.76.ffn_norm.weight
    F32
    [6144]
  • blk.76.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.76.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.76.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.76.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.76.indexer.k_norm.bias
    F32
    [128]
  • blk.76.indexer.k_norm.weight
    F32
    [128]
  • blk.76.indexer.proj.weight
    F32
    [6144, 32]
  • blk.77
  • blk.77.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.77.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.77.attn_kv_a_norm.weight
    F32
    [512]
  • blk.77.attn_norm.weight
    F32
    [6144]
  • blk.77.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.77.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.77.attn_q_a_norm.weight
    F32
    [2048]
  • blk.77.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.77.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.77.exp_probs_b.bias
    F32
    [256]
  • blk.77.ffn_down_exps.weight
    IQ3_XXS
    [2048, 6144, 256]
  • blk.77.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.77.ffn_gate_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.77.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.77.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.77.ffn_norm.weight
    F32
    [6144]
  • blk.77.ffn_up_exps.weight
    IQ2_XXS
    [6144, 2048, 256]
  • blk.77.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.77.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.77.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.77.indexer.k_norm.bias
    F32
    [128]
  • blk.77.indexer.k_norm.weight
    F32
    [128]
  • blk.77.indexer.proj.weight
    F32
    [6144, 32]
  • blk.78
  • blk.78.attn_k_b.weight
    Q8_0
    [192, 512, 64]
  • blk.78.attn_kv_a_mqa.weight
    Q8_0
    [6144, 576]
  • blk.78.attn_kv_a_norm.weight
    F32
    [512]
  • blk.78.attn_norm.weight
    F32
    [6144]
  • blk.78.attn_output.weight
    Q5_K
    [16384, 6144]
  • blk.78.attn_q_a.weight
    Q5_K
    [6144, 2048]
  • blk.78.attn_q_a_norm.weight
    F32
    [2048]
  • blk.78.attn_q_b.weight
    Q8_0
    [2048, 16384]
  • blk.78.attn_v_b.weight
    Q8_0
    [512, 256, 64]
  • blk.78.exp_probs_b.bias
    F32
    [256]
  • blk.78.ffn_down_exps.weight
    Q3_K
    [2048, 6144, 256]
  • blk.78.ffn_down_shexp.weight
    Q6_K
    [2048, 6144]
  • blk.78.ffn_gate_exps.weight
    Q2_K
    [6144, 2048, 256]
  • blk.78.ffn_gate_inp.weight
    F32
    [6144, 256]
  • blk.78.ffn_gate_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.78.ffn_norm.weight
    F32
    [6144]
  • blk.78.ffn_up_exps.weight
    Q2_K
    [6144, 2048, 256]
  • blk.78.ffn_up_shexp.weight
    Q5_K
    [6144, 2048]
  • blk.78.indexer.attn_k.weight
    Q8_0
    [6144, 128]
  • blk.78.indexer.attn_q_b.weight
    Q8_0
    [2048, 4096]
  • blk.78.indexer.k_norm.bias
    F32
    [128]
  • blk.78.indexer.k_norm.weight
    F32
    [128]
  • blk.78.indexer.proj.weight
    F32
    [6144, 32]
  • blk.78.nextn.eh_proj.weight
    Q2_K
    [12288, 6144]
  • blk.78.nextn.enorm.weight
    F32
    [6144]
  • blk.78.nextn.hnorm.weight
    F32
    [6144]
  • blk.78.nextn.shared_head_norm.weight
    F32
    [6144]