Qwen2.5 models are pretrained on Alibaba's latest large-scale dataset, encompassing up to 18 trillion tokens. The models support a context length of up to 128K tokens and offer multilingual support.

Tools 0.5B 1.5B 3B 7B 14B 32B 72B

66.6K Pulls Updated 11 hours ago

133 Tags

dd60673d4ffd · 77GB
    Metadata
  • general.architecture
    qwen2
  • general.file_type
    Q8_0
  • qwen2.attention.head_count
    64
  • qwen2.attention.head_count_kv
    8
  • qwen2.attention.layer_norm_rms_epsilon
    1e-06
  • qwen2.block_count
    80
  • qwen2.context_length
    32768
  • qwen2.embedding_length
    8192
  • qwen2.feed_forward_length
    29568
  • qwen2.rope.freq_base
    1e+06
  • tokenizer.ggml.add_bos_token
    false
  • tokenizer.ggml.bos_token_id
    151643
  • tokenizer.ggml.eos_token_id
    151645
  • tokenizer.ggml.merges
    [Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
  • tokenizer.ggml.model
    gpt2
  • tokenizer.ggml.padding_token_id
    151643
  • tokenizer.ggml.pre
    qwen2
  • tokenizer.ggml.token_type
    [1 1 1 1 1 ...]
  • tokenizer.ggml.tokens
    [! " # $ % ...]
  • Tensors
  • Name
    Type
    Shape
  • token_embd.weight
    Q8_0
    [8192 152064]
  • blk.0
  • blk.0.attn_norm.weight
    F32
    [8192]
  • blk.0.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.0.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.0.ffn_norm.weight
    F32
    [8192]
  • blk.0.attn_k.bias
    F32
    [1024]
  • blk.0.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.0.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.0.attn_q.bias
    F32
    [8192]
  • blk.0.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.0.attn_v.bias
    F32
    [1024]
  • blk.0.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.0.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.1
  • blk.1.attn_norm.weight
    F32
    [8192]
  • blk.1.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.1.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.1.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.1.ffn_norm.weight
    F32
    [8192]
  • blk.1.attn_k.bias
    F32
    [1024]
  • blk.1.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.1.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.1.attn_q.bias
    F32
    [8192]
  • blk.1.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.1.attn_v.bias
    F32
    [1024]
  • blk.1.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.2
  • blk.2.attn_norm.weight
    F32
    [8192]
  • blk.2.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.2.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.2.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.2.ffn_norm.weight
    F32
    [8192]
  • blk.2.attn_k.bias
    F32
    [1024]
  • blk.2.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.2.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.2.attn_q.bias
    F32
    [8192]
  • blk.2.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.2.attn_v.bias
    F32
    [1024]
  • blk.2.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.3
  • blk.3.attn_norm.weight
    F32
    [8192]
  • blk.3.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.3.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.3.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.3.ffn_norm.weight
    F32
    [8192]
  • blk.3.attn_k.bias
    F32
    [1024]
  • blk.3.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.3.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.3.attn_q.bias
    F32
    [8192]
  • blk.3.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.3.attn_v.bias
    F32
    [1024]
  • blk.3.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.4
  • blk.4.attn_norm.weight
    F32
    [8192]
  • blk.4.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.4.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.4.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.4.ffn_norm.weight
    F32
    [8192]
  • blk.4.attn_k.bias
    F32
    [1024]
  • blk.4.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.4.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.4.attn_q.bias
    F32
    [8192]
  • blk.4.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.4.attn_v.bias
    F32
    [1024]
  • blk.4.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.5
  • blk.5.attn_norm.weight
    F32
    [8192]
  • blk.5.ffn_norm.weight
    F32
    [8192]
  • blk.5.attn_k.bias
    F32
    [1024]
  • blk.5.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.5.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.5.attn_q.bias
    F32
    [8192]
  • blk.5.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.5.attn_v.bias
    F32
    [1024]
  • blk.5.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.5.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.5.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.5.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.6
  • blk.6.attn_norm.weight
    F32
    [8192]
  • blk.6.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.6.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.6.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.6.ffn_norm.weight
    F32
    [8192]
  • blk.6.attn_k.bias
    F32
    [1024]
  • blk.6.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.6.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.6.attn_q.bias
    F32
    [8192]
  • blk.6.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.6.attn_v.bias
    F32
    [1024]
  • blk.6.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.7
  • blk.7.attn_norm.weight
    F32
    [8192]
  • blk.7.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.7.ffn_norm.weight
    F32
    [8192]
  • blk.7.attn_k.bias
    F32
    [1024]
  • blk.7.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.7.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.7.attn_q.bias
    F32
    [8192]
  • blk.7.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.7.attn_v.bias
    F32
    [1024]
  • blk.7.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.7.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.7.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.8
  • blk.8.attn_norm.weight
    F32
    [8192]
  • blk.8.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.8.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.8.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.8.ffn_norm.weight
    F32
    [8192]
  • blk.8.attn_k.bias
    F32
    [1024]
  • blk.8.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.8.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.8.attn_q.bias
    F32
    [8192]
  • blk.8.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.8.attn_v.bias
    F32
    [1024]
  • blk.8.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.9
  • blk.9.attn_norm.weight
    F32
    [8192]
  • blk.9.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.9.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.9.ffn_norm.weight
    F32
    [8192]
  • blk.9.attn_k.bias
    F32
    [1024]
  • blk.9.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.9.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.9.attn_q.bias
    F32
    [8192]
  • blk.9.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.9.attn_v.bias
    F32
    [1024]
  • blk.9.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.9.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.10
  • blk.10.attn_norm.weight
    F32
    [8192]
  • blk.10.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.10.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.10.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.10.ffn_norm.weight
    F32
    [8192]
  • blk.10.attn_k.bias
    F32
    [1024]
  • blk.10.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.10.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.10.attn_q.bias
    F32
    [8192]
  • blk.10.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.10.attn_v.bias
    F32
    [1024]
  • blk.10.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.11
  • blk.11.attn_norm.weight
    F32
    [8192]
  • blk.11.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.11.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.11.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.11.ffn_norm.weight
    F32
    [8192]
  • blk.11.attn_k.bias
    F32
    [1024]
  • blk.11.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.11.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.11.attn_q.bias
    F32
    [8192]
  • blk.11.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.11.attn_v.bias
    F32
    [1024]
  • blk.11.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.12
  • blk.12.attn_norm.weight
    F32
    [8192]
  • blk.12.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.12.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.12.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.12.ffn_norm.weight
    F32
    [8192]
  • blk.12.attn_k.bias
    F32
    [1024]
  • blk.12.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.12.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.12.attn_q.bias
    F32
    [8192]
  • blk.12.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.12.attn_v.bias
    F32
    [1024]
  • blk.12.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.13
  • blk.13.attn_norm.weight
    F32
    [8192]
  • blk.13.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.13.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.13.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.13.ffn_norm.weight
    F32
    [8192]
  • blk.13.attn_k.bias
    F32
    [1024]
  • blk.13.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.13.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.13.attn_q.bias
    F32
    [8192]
  • blk.13.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.13.attn_v.bias
    F32
    [1024]
  • blk.13.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.14
  • blk.14.attn_norm.weight
    F32
    [8192]
  • blk.14.ffn_norm.weight
    F32
    [8192]
  • blk.14.attn_k.bias
    F32
    [1024]
  • blk.14.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.14.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.14.attn_q.bias
    F32
    [8192]
  • blk.14.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.14.attn_v.bias
    F32
    [1024]
  • blk.14.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.14.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.14.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.14.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.15
  • blk.15.attn_norm.weight
    F32
    [8192]
  • blk.15.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.15.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.15.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.15.ffn_norm.weight
    F32
    [8192]
  • blk.15.attn_k.bias
    F32
    [1024]
  • blk.15.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.15.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.15.attn_q.bias
    F32
    [8192]
  • blk.15.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.15.attn_v.bias
    F32
    [1024]
  • blk.15.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.16
  • blk.16.attn_norm.weight
    F32
    [8192]
  • blk.16.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.16.ffn_norm.weight
    F32
    [8192]
  • blk.16.attn_k.bias
    F32
    [1024]
  • blk.16.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.16.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.16.attn_q.bias
    F32
    [8192]
  • blk.16.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.16.attn_v.bias
    F32
    [1024]
  • blk.16.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.16.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.16.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.17
  • blk.17.attn_norm.weight
    F32
    [8192]
  • blk.17.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.17.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.17.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.17.ffn_norm.weight
    F32
    [8192]
  • blk.17.attn_k.bias
    F32
    [1024]
  • blk.17.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.17.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.17.attn_q.bias
    F32
    [8192]
  • blk.17.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.17.attn_v.bias
    F32
    [1024]
  • blk.17.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.18
  • blk.18.attn_norm.weight
    F32
    [8192]
  • blk.18.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.18.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.18.ffn_norm.weight
    F32
    [8192]
  • blk.18.attn_k.bias
    F32
    [1024]
  • blk.18.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.18.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.18.attn_q.bias
    F32
    [8192]
  • blk.18.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.18.attn_v.bias
    F32
    [1024]
  • blk.18.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.18.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.19
  • blk.19.attn_norm.weight
    F32
    [8192]
  • blk.19.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.19.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.19.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.19.ffn_norm.weight
    F32
    [8192]
  • blk.19.attn_k.bias
    F32
    [1024]
  • blk.19.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.19.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.19.attn_q.bias
    F32
    [8192]
  • blk.19.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.19.attn_v.bias
    F32
    [1024]
  • blk.19.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.20
  • blk.20.attn_norm.weight
    F32
    [8192]
  • blk.20.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.20.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.20.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.20.ffn_norm.weight
    F32
    [8192]
  • blk.20.attn_k.bias
    F32
    [1024]
  • blk.20.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.20.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.20.attn_q.bias
    F32
    [8192]
  • blk.20.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.20.attn_v.bias
    F32
    [1024]
  • blk.20.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.21
  • blk.21.attn_norm.weight
    F32
    [8192]
  • blk.21.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.21.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.21.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.21.ffn_norm.weight
    F32
    [8192]
  • blk.21.attn_k.bias
    F32
    [1024]
  • blk.21.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.21.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.21.attn_q.bias
    F32
    [8192]
  • blk.21.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.21.attn_v.bias
    F32
    [1024]
  • blk.21.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.22
  • blk.22.attn_norm.weight
    F32
    [8192]
  • blk.22.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.22.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.22.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.22.ffn_norm.weight
    F32
    [8192]
  • blk.22.attn_k.bias
    F32
    [1024]
  • blk.22.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.22.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.22.attn_q.bias
    F32
    [8192]
  • blk.22.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.22.attn_v.bias
    F32
    [1024]
  • blk.22.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.23
  • blk.23.attn_norm.weight
    F32
    [8192]
  • blk.23.ffn_norm.weight
    F32
    [8192]
  • blk.23.attn_k.bias
    F32
    [1024]
  • blk.23.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.23.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.23.attn_q.bias
    F32
    [8192]
  • blk.23.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.23.attn_v.bias
    F32
    [1024]
  • blk.23.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.23.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.23.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.23.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.24
  • blk.24.attn_norm.weight
    F32
    [8192]
  • blk.24.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.24.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.24.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.24.ffn_norm.weight
    F32
    [8192]
  • blk.24.attn_k.bias
    F32
    [1024]
  • blk.24.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.24.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.24.attn_q.bias
    F32
    [8192]
  • blk.24.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.24.attn_v.bias
    F32
    [1024]
  • blk.24.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.25
  • blk.25.attn_norm.weight
    F32
    [8192]
  • blk.25.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.25.ffn_norm.weight
    F32
    [8192]
  • blk.25.attn_k.bias
    F32
    [1024]
  • blk.25.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.25.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.25.attn_q.bias
    F32
    [8192]
  • blk.25.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.25.attn_v.bias
    F32
    [1024]
  • blk.25.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.25.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.25.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.26
  • blk.26.attn_norm.weight
    F32
    [8192]
  • blk.26.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.26.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.26.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.26.ffn_norm.weight
    F32
    [8192]
  • blk.26.attn_k.bias
    F32
    [1024]
  • blk.26.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.26.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.26.attn_q.bias
    F32
    [8192]
  • blk.26.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.26.attn_v.bias
    F32
    [1024]
  • blk.26.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.27
  • blk.27.attn_norm.weight
    F32
    [8192]
  • blk.27.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.27.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.27.ffn_norm.weight
    F32
    [8192]
  • blk.27.attn_k.bias
    F32
    [1024]
  • blk.27.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.27.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.27.attn_q.bias
    F32
    [8192]
  • blk.27.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.27.attn_v.bias
    F32
    [1024]
  • blk.27.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.27.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.28
  • blk.28.attn_norm.weight
    F32
    [8192]
  • blk.28.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.28.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.28.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.28.ffn_norm.weight
    F32
    [8192]
  • blk.28.attn_k.bias
    F32
    [1024]
  • blk.28.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.28.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.28.attn_q.bias
    F32
    [8192]
  • blk.28.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.28.attn_v.bias
    F32
    [1024]
  • blk.28.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.29
  • blk.29.attn_norm.weight
    F32
    [8192]
  • blk.29.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.29.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.29.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.29.ffn_norm.weight
    F32
    [8192]
  • blk.29.attn_k.bias
    F32
    [1024]
  • blk.29.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.29.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.29.attn_q.bias
    F32
    [8192]
  • blk.29.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.29.attn_v.bias
    F32
    [1024]
  • blk.29.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.30
  • blk.30.attn_norm.weight
    F32
    [8192]
  • blk.30.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.30.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.30.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.30.ffn_norm.weight
    F32
    [8192]
  • blk.30.attn_k.bias
    F32
    [1024]
  • blk.30.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.30.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.30.attn_q.bias
    F32
    [8192]
  • blk.30.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.30.attn_v.bias
    F32
    [1024]
  • blk.30.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.31
  • blk.31.attn_norm.weight
    F32
    [8192]
  • blk.31.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.31.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.31.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.31.ffn_norm.weight
    F32
    [8192]
  • blk.31.attn_k.bias
    F32
    [1024]
  • blk.31.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.31.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.31.attn_q.bias
    F32
    [8192]
  • blk.31.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.31.attn_v.bias
    F32
    [1024]
  • blk.31.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.32
  • blk.32.attn_norm.weight
    F32
    [8192]
  • blk.32.ffn_norm.weight
    F32
    [8192]
  • blk.32.attn_k.bias
    F32
    [1024]
  • blk.32.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.32.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.32.attn_q.bias
    F32
    [8192]
  • blk.32.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.32.attn_v.bias
    F32
    [1024]
  • blk.32.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.32.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.32.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.32.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.33
  • blk.33.attn_norm.weight
    F32
    [8192]
  • blk.33.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.33.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.33.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.33.ffn_norm.weight
    F32
    [8192]
  • blk.33.attn_k.bias
    F32
    [1024]
  • blk.33.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.33.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.33.attn_q.bias
    F32
    [8192]
  • blk.33.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.33.attn_v.bias
    F32
    [1024]
  • blk.33.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.34
  • blk.34.attn_norm.weight
    F32
    [8192]
  • blk.34.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.34.ffn_norm.weight
    F32
    [8192]
  • blk.34.attn_k.bias
    F32
    [1024]
  • blk.34.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.34.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.34.attn_q.bias
    F32
    [8192]
  • blk.34.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.34.attn_v.bias
    F32
    [1024]
  • blk.34.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.34.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.34.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.35
  • blk.35.attn_norm.weight
    F32
    [8192]
  • blk.35.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.35.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.35.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.35.ffn_norm.weight
    F32
    [8192]
  • blk.35.attn_k.bias
    F32
    [1024]
  • blk.35.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.35.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.35.attn_q.bias
    F32
    [8192]
  • blk.35.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.35.attn_v.bias
    F32
    [1024]
  • blk.35.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.36
  • blk.36.attn_norm.weight
    F32
    [8192]
  • blk.36.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.36.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.36.ffn_norm.weight
    F32
    [8192]
  • blk.36.attn_k.bias
    F32
    [1024]
  • blk.36.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.36.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.36.attn_q.bias
    F32
    [8192]
  • blk.36.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.36.attn_v.bias
    F32
    [1024]
  • blk.36.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.36.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.37
  • blk.37.attn_norm.weight
    F32
    [8192]
  • blk.37.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.37.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.37.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.37.ffn_norm.weight
    F32
    [8192]
  • blk.37.attn_k.bias
    F32
    [1024]
  • blk.37.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.37.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.37.attn_q.bias
    F32
    [8192]
  • blk.37.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.37.attn_v.bias
    F32
    [1024]
  • blk.37.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.38
  • blk.38.attn_norm.weight
    F32
    [8192]
  • blk.38.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.38.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.38.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.38.ffn_norm.weight
    F32
    [8192]
  • blk.38.attn_k.bias
    F32
    [1024]
  • blk.38.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.38.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.38.attn_q.bias
    F32
    [8192]
  • blk.38.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.38.attn_v.bias
    F32
    [1024]
  • blk.38.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.39
  • blk.39.attn_norm.weight
    F32
    [8192]
  • blk.39.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.39.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.39.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.39.ffn_norm.weight
    F32
    [8192]
  • blk.39.attn_k.bias
    F32
    [1024]
  • blk.39.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.39.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.39.attn_q.bias
    F32
    [8192]
  • blk.39.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.39.attn_v.bias
    F32
    [1024]
  • blk.39.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.40
  • blk.40.attn_norm.weight
    F32
    [8192]
  • blk.40.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.40.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.40.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.40.ffn_norm.weight
    F32
    [8192]
  • blk.40.attn_k.bias
    F32
    [1024]
  • blk.40.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.40.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.40.attn_q.bias
    F32
    [8192]
  • blk.40.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.40.attn_v.bias
    F32
    [1024]
  • blk.40.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.41
  • blk.41.attn_norm.weight
    F32
    [8192]
  • blk.41.ffn_norm.weight
    F32
    [8192]
  • blk.41.attn_k.bias
    F32
    [1024]
  • blk.41.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.41.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.41.attn_q.bias
    F32
    [8192]
  • blk.41.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.41.attn_v.bias
    F32
    [1024]
  • blk.41.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.41.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.41.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.41.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.42
  • blk.42.attn_norm.weight
    F32
    [8192]
  • blk.42.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.42.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.42.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.42.ffn_norm.weight
    F32
    [8192]
  • blk.42.attn_k.bias
    F32
    [1024]
  • blk.42.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.42.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.42.attn_q.bias
    F32
    [8192]
  • blk.42.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.42.attn_v.bias
    F32
    [1024]
  • blk.42.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.43
  • blk.43.attn_norm.weight
    F32
    [8192]
  • blk.43.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.43.ffn_norm.weight
    F32
    [8192]
  • blk.43.attn_k.bias
    F32
    [1024]
  • blk.43.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.43.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.43.attn_q.bias
    F32
    [8192]
  • blk.43.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.43.attn_v.bias
    F32
    [1024]
  • blk.43.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.43.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.43.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.44
  • blk.44.attn_norm.weight
    F32
    [8192]
  • blk.44.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.44.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.44.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.44.ffn_norm.weight
    F32
    [8192]
  • blk.44.attn_k.bias
    F32
    [1024]
  • blk.44.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.44.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.44.attn_q.bias
    F32
    [8192]
  • blk.44.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.44.attn_v.bias
    F32
    [1024]
  • blk.44.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.45
  • blk.45.attn_norm.weight
    F32
    [8192]
  • blk.45.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.45.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.45.ffn_norm.weight
    F32
    [8192]
  • blk.45.attn_k.bias
    F32
    [1024]
  • blk.45.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.45.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.45.attn_q.bias
    F32
    [8192]
  • blk.45.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.45.attn_v.bias
    F32
    [1024]
  • blk.45.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.45.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.46
  • blk.46.attn_norm.weight
    F32
    [8192]
  • blk.46.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.46.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.46.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.46.ffn_norm.weight
    F32
    [8192]
  • blk.46.attn_k.bias
    F32
    [1024]
  • blk.46.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.46.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.46.attn_q.bias
    F32
    [8192]
  • blk.46.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.46.attn_v.bias
    F32
    [1024]
  • blk.46.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.47
  • blk.47.attn_norm.weight
    F32
    [8192]
  • blk.47.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.47.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.47.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.47.ffn_norm.weight
    F32
    [8192]
  • blk.47.attn_k.bias
    F32
    [1024]
  • blk.47.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.47.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.47.attn_q.bias
    F32
    [8192]
  • blk.47.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.47.attn_v.bias
    F32
    [1024]
  • blk.47.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.48
  • blk.48.attn_norm.weight
    F32
    [8192]
  • blk.48.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.48.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.48.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.48.ffn_norm.weight
    F32
    [8192]
  • blk.48.attn_k.bias
    F32
    [1024]
  • blk.48.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.48.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.48.attn_q.bias
    F32
    [8192]
  • blk.48.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.48.attn_v.bias
    F32
    [1024]
  • blk.48.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.49
  • blk.49.attn_norm.weight
    F32
    [8192]
  • blk.49.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.49.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.49.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.49.ffn_norm.weight
    F32
    [8192]
  • blk.49.attn_k.bias
    F32
    [1024]
  • blk.49.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.49.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.49.attn_q.bias
    F32
    [8192]
  • blk.49.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.49.attn_v.bias
    F32
    [1024]
  • blk.49.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.50
  • blk.50.attn_norm.weight
    F32
    [8192]
  • blk.50.ffn_norm.weight
    F32
    [8192]
  • blk.50.attn_k.bias
    F32
    [1024]
  • blk.50.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.50.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.50.attn_q.bias
    F32
    [8192]
  • blk.50.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.50.attn_v.bias
    F32
    [1024]
  • blk.50.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.50.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.50.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.50.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.51
  • blk.51.attn_norm.weight
    F32
    [8192]
  • blk.51.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.51.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.51.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.51.ffn_norm.weight
    F32
    [8192]
  • blk.51.attn_k.bias
    F32
    [1024]
  • blk.51.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.51.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.51.attn_q.bias
    F32
    [8192]
  • blk.51.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.51.attn_v.bias
    F32
    [1024]
  • blk.51.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.52
  • blk.52.attn_norm.weight
    F32
    [8192]
  • blk.52.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.52.ffn_norm.weight
    F32
    [8192]
  • blk.52.attn_k.bias
    F32
    [1024]
  • blk.52.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.52.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.52.attn_q.bias
    F32
    [8192]
  • blk.52.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.52.attn_v.bias
    F32
    [1024]
  • blk.52.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.52.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.52.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.53
  • blk.53.attn_norm.weight
    F32
    [8192]
  • blk.53.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.53.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.53.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.53.ffn_norm.weight
    F32
    [8192]
  • blk.53.attn_k.bias
    F32
    [1024]
  • blk.53.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.53.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.53.attn_q.bias
    F32
    [8192]
  • blk.53.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.53.attn_v.bias
    F32
    [1024]
  • blk.53.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.54
  • blk.54.attn_norm.weight
    F32
    [8192]
  • blk.54.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.54.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.54.ffn_norm.weight
    F32
    [8192]
  • blk.54.attn_k.bias
    F32
    [1024]
  • blk.54.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.54.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.54.attn_q.bias
    F32
    [8192]
  • blk.54.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.54.attn_v.bias
    F32
    [1024]
  • blk.54.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.54.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.55
  • blk.55.attn_norm.weight
    F32
    [8192]
  • blk.55.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.55.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.55.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.55.ffn_norm.weight
    F32
    [8192]
  • blk.55.attn_k.bias
    F32
    [1024]
  • blk.55.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.55.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.55.attn_q.bias
    F32
    [8192]
  • blk.55.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.55.attn_v.bias
    F32
    [1024]
  • blk.55.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.56
  • blk.56.attn_norm.weight
    F32
    [8192]
  • blk.56.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.56.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.56.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.56.ffn_norm.weight
    F32
    [8192]
  • blk.56.attn_k.bias
    F32
    [1024]
  • blk.56.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.56.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.56.attn_q.bias
    F32
    [8192]
  • blk.56.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.56.attn_v.bias
    F32
    [1024]
  • blk.56.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.57
  • blk.57.attn_norm.weight
    F32
    [8192]
  • blk.57.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.57.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.57.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.57.ffn_norm.weight
    F32
    [8192]
  • blk.57.attn_k.bias
    F32
    [1024]
  • blk.57.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.57.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.57.attn_q.bias
    F32
    [8192]
  • blk.57.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.57.attn_v.bias
    F32
    [1024]
  • blk.57.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.58
  • blk.58.attn_norm.weight
    F32
    [8192]
  • blk.58.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.58.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.58.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.58.ffn_norm.weight
    F32
    [8192]
  • blk.58.attn_k.bias
    F32
    [1024]
  • blk.58.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.58.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.58.attn_q.bias
    F32
    [8192]
  • blk.58.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.58.attn_v.bias
    F32
    [1024]
  • blk.58.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.59
  • blk.59.attn_norm.weight
    F32
    [8192]
  • blk.59.ffn_norm.weight
    F32
    [8192]
  • blk.59.attn_k.bias
    F32
    [1024]
  • blk.59.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.59.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.59.attn_q.bias
    F32
    [8192]
  • blk.59.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.59.attn_v.bias
    F32
    [1024]
  • blk.59.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.59.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.59.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.59.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.60
  • blk.60.attn_norm.weight
    F32
    [8192]
  • blk.60.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.60.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.60.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.60.ffn_norm.weight
    F32
    [8192]
  • blk.60.attn_k.bias
    F32
    [1024]
  • blk.60.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.60.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.60.attn_q.bias
    F32
    [8192]
  • blk.60.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.60.attn_v.bias
    F32
    [1024]
  • blk.60.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.61
  • blk.61.attn_norm.weight
    F32
    [8192]
  • blk.61.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.61.ffn_norm.weight
    F32
    [8192]
  • blk.61.attn_k.bias
    F32
    [1024]
  • blk.61.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.61.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.61.attn_q.bias
    F32
    [8192]
  • blk.61.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.61.attn_v.bias
    F32
    [1024]
  • blk.61.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.61.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.61.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.62
  • blk.62.attn_norm.weight
    F32
    [8192]
  • blk.62.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.62.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.62.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.62.ffn_norm.weight
    F32
    [8192]
  • blk.62.attn_k.bias
    F32
    [1024]
  • blk.62.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.62.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.62.attn_q.bias
    F32
    [8192]
  • blk.62.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.62.attn_v.bias
    F32
    [1024]
  • blk.62.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.63
  • blk.63.attn_norm.weight
    F32
    [8192]
  • blk.63.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.63.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.63.ffn_norm.weight
    F32
    [8192]
  • blk.63.attn_k.bias
    F32
    [1024]
  • blk.63.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.63.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.63.attn_q.bias
    F32
    [8192]
  • blk.63.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.63.attn_v.bias
    F32
    [1024]
  • blk.63.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.63.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.64
  • blk.64.attn_norm.weight
    F32
    [8192]
  • blk.64.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.64.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.64.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.64.ffn_norm.weight
    F32
    [8192]
  • blk.64.attn_k.bias
    F32
    [1024]
  • blk.64.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.64.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.64.attn_q.bias
    F32
    [8192]
  • blk.64.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.64.attn_v.bias
    F32
    [1024]
  • blk.64.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.65
  • blk.65.attn_norm.weight
    F32
    [8192]
  • blk.65.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.65.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.65.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.65.ffn_norm.weight
    F32
    [8192]
  • blk.65.attn_k.bias
    F32
    [1024]
  • blk.65.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.65.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.65.attn_q.bias
    F32
    [8192]
  • blk.65.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.65.attn_v.bias
    F32
    [1024]
  • blk.65.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.66
  • blk.66.attn_norm.weight
    F32
    [8192]
  • blk.66.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.66.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.66.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.66.ffn_norm.weight
    F32
    [8192]
  • blk.66.attn_k.bias
    F32
    [1024]
  • blk.66.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.66.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.66.attn_q.bias
    F32
    [8192]
  • blk.66.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.66.attn_v.bias
    F32
    [1024]
  • blk.66.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.67
  • blk.67.attn_norm.weight
    F32
    [8192]
  • blk.67.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.67.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.67.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.67.ffn_norm.weight
    F32
    [8192]
  • blk.67.attn_k.bias
    F32
    [1024]
  • blk.67.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.67.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.67.attn_q.bias
    F32
    [8192]
  • blk.67.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.67.attn_v.bias
    F32
    [1024]
  • blk.67.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.68
  • blk.68.attn_norm.weight
    F32
    [8192]
  • blk.68.ffn_norm.weight
    F32
    [8192]
  • blk.68.attn_k.bias
    F32
    [1024]
  • blk.68.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.68.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.68.attn_q.bias
    F32
    [8192]
  • blk.68.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.68.attn_v.bias
    F32
    [1024]
  • blk.68.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.68.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.68.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.68.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.69
  • blk.69.attn_norm.weight
    F32
    [8192]
  • blk.69.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.69.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.69.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.69.ffn_norm.weight
    F32
    [8192]
  • blk.69.attn_k.bias
    F32
    [1024]
  • blk.69.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.69.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.69.attn_q.bias
    F32
    [8192]
  • blk.69.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.69.attn_v.bias
    F32
    [1024]
  • blk.69.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.70
  • blk.70.attn_norm.weight
    F32
    [8192]
  • blk.70.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.70.ffn_norm.weight
    F32
    [8192]
  • blk.70.attn_k.bias
    F32
    [1024]
  • blk.70.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.70.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.70.attn_q.bias
    F32
    [8192]
  • blk.70.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.70.attn_v.bias
    F32
    [1024]
  • blk.70.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.70.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.70.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.71
  • blk.71.attn_norm.weight
    F32
    [8192]
  • blk.71.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.71.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.71.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.71.ffn_norm.weight
    F32
    [8192]
  • blk.71.attn_k.bias
    F32
    [1024]
  • blk.71.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.71.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.71.attn_q.bias
    F32
    [8192]
  • blk.71.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.71.attn_v.bias
    F32
    [1024]
  • blk.71.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.72
  • blk.72.attn_norm.weight
    F32
    [8192]
  • blk.72.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.72.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.72.ffn_norm.weight
    F32
    [8192]
  • blk.72.attn_k.bias
    F32
    [1024]
  • blk.72.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.72.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.72.attn_q.bias
    F32
    [8192]
  • blk.72.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.72.attn_v.bias
    F32
    [1024]
  • blk.72.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.72.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.73
  • blk.73.attn_norm.weight
    F32
    [8192]
  • blk.73.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.73.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.73.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.73.ffn_norm.weight
    F32
    [8192]
  • blk.73.attn_k.bias
    F32
    [1024]
  • blk.73.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.73.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.73.attn_q.bias
    F32
    [8192]
  • blk.73.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.73.attn_v.bias
    F32
    [1024]
  • blk.73.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.74
  • blk.74.attn_norm.weight
    F32
    [8192]
  • blk.74.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.74.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.74.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.74.ffn_norm.weight
    F32
    [8192]
  • blk.74.attn_k.bias
    F32
    [1024]
  • blk.74.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.74.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.74.attn_q.bias
    F32
    [8192]
  • blk.74.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.74.attn_v.bias
    F32
    [1024]
  • blk.74.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.75
  • blk.75.attn_norm.weight
    F32
    [8192]
  • blk.75.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.75.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.75.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.75.ffn_norm.weight
    F32
    [8192]
  • blk.75.attn_k.bias
    F32
    [1024]
  • blk.75.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.75.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.75.attn_q.bias
    F32
    [8192]
  • blk.75.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.75.attn_v.bias
    F32
    [1024]
  • blk.75.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.76
  • blk.76.attn_norm.weight
    F32
    [8192]
  • blk.76.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.76.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.76.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.76.ffn_norm.weight
    F32
    [8192]
  • blk.76.attn_k.bias
    F32
    [1024]
  • blk.76.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.76.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.76.attn_q.bias
    F32
    [8192]
  • blk.76.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.76.attn_v.bias
    F32
    [1024]
  • blk.76.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.77
  • blk.77.attn_norm.weight
    F32
    [8192]
  • blk.77.ffn_norm.weight
    F32
    [8192]
  • blk.77.attn_k.bias
    F32
    [1024]
  • blk.77.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.77.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.77.attn_q.bias
    F32
    [8192]
  • blk.77.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.77.attn_v.bias
    F32
    [1024]
  • blk.77.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.77.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.77.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.77.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.78
  • blk.78.attn_norm.weight
    F32
    [8192]
  • blk.78.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.78.ffn_gate.weight
    Q8_0
    [8192 29568]
  • blk.78.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.78.ffn_norm.weight
    F32
    [8192]
  • blk.78.attn_k.bias
    F32
    [1024]
  • blk.78.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.78.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.78.attn_q.bias
    F32
    [8192]
  • blk.78.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.78.attn_v.bias
    F32
    [1024]
  • blk.78.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.79
  • blk.79.attn_norm.weight
    F32
    [8192]
  • blk.79.ffn_up.weight
    Q8_0
    [8192 29568]
  • blk.79.ffn_norm.weight
    F32
    [8192]
  • blk.79.attn_k.bias
    F32
    [1024]
  • blk.79.attn_k.weight
    Q8_0
    [8192 1024]
  • blk.79.attn_output.weight
    Q8_0
    [8192 8192]
  • blk.79.attn_q.bias
    F32
    [8192]
  • blk.79.attn_q.weight
    Q8_0
    [8192 8192]
  • blk.79.attn_v.bias
    F32
    [1024]
  • blk.79.attn_v.weight
    Q8_0
    [8192 1024]
  • blk.79.ffn_down.weight
    Q8_0
    [29568 8192]
  • blk.79.ffn_gate.weight
    Q8_0
    [8192 29568]
  • output.weight
    Q8_0
    [8192 152064]
  • output_norm.weight
    F32
    [8192]