latest
9.2GB
82 Pulls Updated 4 months ago
f83629527eb6 · 9.2GB
-
general.architectureqwen2
-
general.file_typeQ4_K_M
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv40
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count40
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length13696
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_K[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ8_0[13696 5120]
-
blk.0.ffn_gate.weightQ4_K[5120 13696]
-
blk.0.ffn_up.weightQ4_K[5120 13696]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[5120]
-
blk.0.attn_k.weightQ4_K[5120 5120]
-
blk.0.attn_output.weightQ4_K[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightQ4_K[5120 5120]
-
blk.0.attn_v.biasF32[5120]
-
blk.0.attn_v.weightQ6_K[5120 5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ8_0[13696 5120]
-
blk.1.ffn_gate.weightQ4_K[5120 13696]
-
blk.1.ffn_up.weightQ4_K[5120 13696]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[5120]
-
blk.1.attn_k.weightQ4_K[5120 5120]
-
blk.1.attn_output.weightQ4_K[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightQ4_K[5120 5120]
-
blk.1.attn_v.biasF32[5120]
-
blk.1.attn_v.weightQ6_K[5120 5120]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ5_0[13696 5120]
-
blk.2.ffn_gate.weightQ4_K[5120 13696]
-
blk.2.ffn_up.weightQ4_K[5120 13696]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.biasF32[5120]
-
blk.2.attn_k.weightQ4_K[5120 5120]
-
blk.2.attn_output.weightQ4_K[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightQ4_K[5120 5120]
-
blk.2.attn_v.biasF32[5120]
-
blk.2.attn_v.weightQ4_K[5120 5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ5_0[13696 5120]
-
blk.3.ffn_gate.weightQ4_K[5120 13696]
-
blk.3.ffn_up.weightQ4_K[5120 13696]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[5120]
-
blk.3.attn_k.weightQ4_K[5120 5120]
-
blk.3.attn_output.weightQ4_K[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightQ4_K[5120 5120]
-
blk.3.attn_v.biasF32[5120]
-
blk.3.attn_v.weightQ6_K[5120 5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ8_0[13696 5120]
-
blk.4.ffn_gate.weightQ4_K[5120 13696]
-
blk.4.ffn_up.weightQ4_K[5120 13696]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[5120]
-
blk.4.attn_k.weightQ4_K[5120 5120]
-
blk.4.attn_output.weightQ4_K[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightQ4_K[5120 5120]
-
blk.4.attn_v.biasF32[5120]
-
blk.4.attn_v.weightQ4_K[5120 5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ5_0[13696 5120]
-
blk.5.ffn_gate.weightQ4_K[5120 13696]
-
blk.5.ffn_up.weightQ4_K[5120 13696]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[5120]
-
blk.5.attn_k.weightQ4_K[5120 5120]
-
blk.5.attn_output.weightQ4_K[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightQ4_K[5120 5120]
-
blk.5.attn_v.biasF32[5120]
-
blk.5.attn_v.weightQ4_K[5120 5120]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ5_0[13696 5120]
-
blk.6.ffn_gate.weightQ4_K[5120 13696]
-
blk.6.ffn_up.weightQ4_K[5120 13696]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.biasF32[5120]
-
blk.6.attn_k.weightQ4_K[5120 5120]
-
blk.6.attn_output.weightQ4_K[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightQ4_K[5120 5120]
-
blk.6.attn_v.biasF32[5120]
-
blk.6.attn_v.weightQ6_K[5120 5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ8_0[13696 5120]
-
blk.7.ffn_gate.weightQ4_K[5120 13696]
-
blk.7.ffn_up.weightQ4_K[5120 13696]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[5120]
-
blk.7.attn_k.weightQ4_K[5120 5120]
-
blk.7.attn_output.weightQ4_K[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightQ4_K[5120 5120]
-
blk.7.attn_v.biasF32[5120]
-
blk.7.attn_v.weightQ4_K[5120 5120]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ5_0[13696 5120]
-
blk.8.ffn_gate.weightQ4_K[5120 13696]
-
blk.8.ffn_up.weightQ4_K[5120 13696]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.biasF32[5120]
-
blk.8.attn_k.weightQ4_K[5120 5120]
-
blk.8.attn_output.weightQ4_K[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightQ4_K[5120 5120]
-
blk.8.attn_v.biasF32[5120]
-
blk.8.attn_v.weightQ4_K[5120 5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ5_0[13696 5120]
-
blk.9.ffn_gate.weightQ4_K[5120 13696]
-
blk.9.ffn_up.weightQ4_K[5120 13696]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[5120]
-
blk.9.attn_k.weightQ4_K[5120 5120]
-
blk.9.attn_output.weightQ4_K[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightQ4_K[5120 5120]
-
blk.9.attn_v.biasF32[5120]
-
blk.9.attn_v.weightQ6_K[5120 5120]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ8_0[13696 5120]
-
blk.10.ffn_gate.weightQ4_K[5120 13696]
-
blk.10.ffn_up.weightQ4_K[5120 13696]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.biasF32[5120]
-
blk.10.attn_k.weightQ4_K[5120 5120]
-
blk.10.attn_output.weightQ4_K[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightQ4_K[5120 5120]
-
blk.10.attn_v.biasF32[5120]
-
blk.10.attn_v.weightQ6_K[5120 5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ8_0[13696 5120]
-
blk.11.ffn_gate.weightQ4_K[5120 13696]
-
blk.11.ffn_up.weightQ4_K[5120 13696]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[5120]
-
blk.11.attn_k.weightQ4_K[5120 5120]
-
blk.11.attn_output.weightQ4_K[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightQ4_K[5120 5120]
-
blk.11.attn_v.biasF32[5120]
-
blk.11.attn_v.weightQ6_K[5120 5120]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ8_0[13696 5120]
-
blk.12.ffn_gate.weightQ4_K[5120 13696]
-
blk.12.ffn_up.weightQ4_K[5120 13696]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[5120]
-
blk.12.attn_k.weightQ4_K[5120 5120]
-
blk.12.attn_output.weightQ4_K[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightQ4_K[5120 5120]
-
blk.12.attn_v.biasF32[5120]
-
blk.12.attn_v.weightQ6_K[5120 5120]
-
blk.13.attn_k.biasF32[5120]
-
blk.13.attn_k.weightQ4_K[5120 5120]
-
blk.13.attn_output.weightQ4_K[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightQ4_K[5120 5120]
-
blk.13.attn_v.biasF32[5120]
-
blk.13.attn_v.weightQ4_K[5120 5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ8_0[13696 5120]
-
blk.13.ffn_gate.weightQ4_K[5120 13696]
-
blk.13.ffn_up.weightQ4_K[5120 13696]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ5_0[13696 5120]
-
blk.14.ffn_gate.weightQ4_K[5120 13696]
-
blk.14.ffn_up.weightQ4_K[5120 13696]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.biasF32[5120]
-
blk.14.attn_k.weightQ4_K[5120 5120]
-
blk.14.attn_output.weightQ4_K[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightQ4_K[5120 5120]
-
blk.14.attn_v.biasF32[5120]
-
blk.14.attn_v.weightQ4_K[5120 5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ5_0[13696 5120]
-
blk.15.ffn_gate.weightQ4_K[5120 13696]
-
blk.15.ffn_up.weightQ4_K[5120 13696]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[5120]
-
blk.15.attn_k.weightQ4_K[5120 5120]
-
blk.15.attn_output.weightQ4_K[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightQ4_K[5120 5120]
-
blk.15.attn_v.biasF32[5120]
-
blk.15.attn_v.weightQ4_K[5120 5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ8_0[13696 5120]
-
blk.16.ffn_gate.weightQ4_K[5120 13696]
-
blk.16.ffn_up.weightQ4_K[5120 13696]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.biasF32[5120]
-
blk.16.attn_k.weightQ4_K[5120 5120]
-
blk.16.attn_output.weightQ4_K[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightQ4_K[5120 5120]
-
blk.16.attn_v.biasF32[5120]
-
blk.16.attn_v.weightQ6_K[5120 5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ5_0[13696 5120]
-
blk.17.ffn_gate.weightQ4_K[5120 13696]
-
blk.17.ffn_up.weightQ4_K[5120 13696]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[5120]
-
blk.17.attn_k.weightQ4_K[5120 5120]
-
blk.17.attn_output.weightQ4_K[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightQ4_K[5120 5120]
-
blk.17.attn_v.biasF32[5120]
-
blk.17.attn_v.weightQ4_K[5120 5120]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ5_0[13696 5120]
-
blk.18.ffn_gate.weightQ4_K[5120 13696]
-
blk.18.ffn_up.weightQ4_K[5120 13696]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.biasF32[5120]
-
blk.18.attn_k.weightQ4_K[5120 5120]
-
blk.18.attn_output.weightQ4_K[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightQ4_K[5120 5120]
-
blk.18.attn_v.biasF32[5120]
-
blk.18.attn_v.weightQ4_K[5120 5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ8_0[13696 5120]
-
blk.19.ffn_gate.weightQ4_K[5120 13696]
-
blk.19.ffn_up.weightQ4_K[5120 13696]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[5120]
-
blk.19.attn_k.weightQ4_K[5120 5120]
-
blk.19.attn_output.weightQ4_K[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightQ4_K[5120 5120]
-
blk.19.attn_v.biasF32[5120]
-
blk.19.attn_v.weightQ6_K[5120 5120]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ5_0[13696 5120]
-
blk.20.ffn_gate.weightQ4_K[5120 13696]
-
blk.20.ffn_up.weightQ4_K[5120 13696]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[5120]
-
blk.20.attn_k.weightQ4_K[5120 5120]
-
blk.20.attn_output.weightQ4_K[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightQ4_K[5120 5120]
-
blk.20.attn_v.biasF32[5120]
-
blk.20.attn_v.weightQ4_K[5120 5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ5_0[13696 5120]
-
blk.21.ffn_gate.weightQ4_K[5120 13696]
-
blk.21.ffn_up.weightQ4_K[5120 13696]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[5120]
-
blk.21.attn_k.weightQ4_K[5120 5120]
-
blk.21.attn_output.weightQ4_K[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightQ4_K[5120 5120]
-
blk.21.attn_v.biasF32[5120]
-
blk.21.attn_v.weightQ4_K[5120 5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ8_0[13696 5120]
-
blk.22.ffn_gate.weightQ4_K[5120 13696]
-
blk.22.ffn_up.weightQ4_K[5120 13696]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.biasF32[5120]
-
blk.22.attn_k.weightQ4_K[5120 5120]
-
blk.22.attn_output.weightQ4_K[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightQ4_K[5120 5120]
-
blk.22.attn_v.biasF32[5120]
-
blk.22.attn_v.weightQ6_K[5120 5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ5_0[13696 5120]
-
blk.23.ffn_gate.weightQ4_K[5120 13696]
-
blk.23.ffn_up.weightQ4_K[5120 13696]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[5120]
-
blk.23.attn_k.weightQ4_K[5120 5120]
-
blk.23.attn_output.weightQ4_K[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightQ4_K[5120 5120]
-
blk.23.attn_v.biasF32[5120]
-
blk.23.attn_v.weightQ4_K[5120 5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ5_0[13696 5120]
-
blk.24.ffn_gate.weightQ4_K[5120 13696]
-
blk.24.ffn_up.weightQ4_K[5120 13696]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[5120]
-
blk.24.attn_k.weightQ4_K[5120 5120]
-
blk.24.attn_output.weightQ4_K[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightQ4_K[5120 5120]
-
blk.24.attn_v.biasF32[5120]
-
blk.24.attn_v.weightQ4_K[5120 5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ8_0[13696 5120]
-
blk.25.ffn_gate.weightQ4_K[5120 13696]
-
blk.25.ffn_up.weightQ4_K[5120 13696]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[5120]
-
blk.25.attn_k.weightQ4_K[5120 5120]
-
blk.25.attn_output.weightQ4_K[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightQ4_K[5120 5120]
-
blk.25.attn_v.biasF32[5120]
-
blk.25.attn_v.weightQ6_K[5120 5120]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ5_0[13696 5120]
-
blk.26.ffn_gate.weightQ4_K[5120 13696]
-
blk.26.ffn_up.weightQ4_K[5120 13696]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.biasF32[5120]
-
blk.26.attn_k.weightQ4_K[5120 5120]
-
blk.26.attn_output.weightQ4_K[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightQ4_K[5120 5120]
-
blk.26.attn_v.biasF32[5120]
-
blk.26.attn_v.weightQ4_K[5120 5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ5_0[13696 5120]
-
blk.27.ffn_gate.weightQ4_K[5120 13696]
-
blk.27.ffn_up.weightQ4_K[5120 13696]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[5120]
-
blk.27.attn_k.weightQ4_K[5120 5120]
-
blk.27.attn_output.weightQ4_K[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightQ4_K[5120 5120]
-
blk.27.attn_v.biasF32[5120]
-
blk.27.attn_v.weightQ4_K[5120 5120]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ8_0[13696 5120]
-
blk.28.ffn_gate.weightQ4_K[5120 13696]
-
blk.28.ffn_up.weightQ4_K[5120 13696]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.biasF32[5120]
-
blk.28.attn_k.weightQ4_K[5120 5120]
-
blk.28.attn_output.weightQ4_K[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightQ4_K[5120 5120]
-
blk.28.attn_v.biasF32[5120]
-
blk.28.attn_v.weightQ6_K[5120 5120]
-
blk.29.attn_k.biasF32[5120]
-
blk.29.attn_k.weightQ4_K[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightQ4_K[5120 5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ5_0[13696 5120]
-
blk.29.ffn_gate.weightQ4_K[5120 13696]
-
blk.29.ffn_up.weightQ4_K[5120 13696]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ4_K[5120 5120]
-
blk.29.attn_v.biasF32[5120]
-
blk.29.attn_v.weightQ4_K[5120 5120]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ5_0[13696 5120]
-
blk.30.ffn_gate.weightQ4_K[5120 13696]
-
blk.30.ffn_up.weightQ4_K[5120 13696]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.biasF32[5120]
-
blk.30.attn_k.weightQ4_K[5120 5120]
-
blk.30.attn_output.weightQ4_K[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightQ4_K[5120 5120]
-
blk.30.attn_v.biasF32[5120]
-
blk.30.attn_v.weightQ4_K[5120 5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ8_0[13696 5120]
-
blk.31.ffn_gate.weightQ4_K[5120 13696]
-
blk.31.ffn_up.weightQ4_K[5120 13696]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[5120]
-
blk.31.attn_k.weightQ4_K[5120 5120]
-
blk.31.attn_output.weightQ4_K[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightQ4_K[5120 5120]
-
blk.31.attn_v.biasF32[5120]
-
blk.31.attn_v.weightQ6_K[5120 5120]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ5_0[13696 5120]
-
blk.32.ffn_gate.weightQ4_K[5120 13696]
-
blk.32.ffn_up.weightQ4_K[5120 13696]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[5120]
-
blk.32.attn_k.weightQ4_K[5120 5120]
-
blk.32.attn_output.weightQ4_K[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightQ4_K[5120 5120]
-
blk.32.attn_v.biasF32[5120]
-
blk.32.attn_v.weightQ4_K[5120 5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ5_0[13696 5120]
-
blk.33.ffn_gate.weightQ4_K[5120 13696]
-
blk.33.ffn_up.weightQ4_K[5120 13696]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[5120]
-
blk.33.attn_k.weightQ4_K[5120 5120]
-
blk.33.attn_output.weightQ4_K[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightQ4_K[5120 5120]
-
blk.33.attn_v.biasF32[5120]
-
blk.33.attn_v.weightQ4_K[5120 5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ8_0[13696 5120]
-
blk.34.ffn_gate.weightQ4_K[5120 13696]
-
blk.34.ffn_up.weightQ4_K[5120 13696]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.biasF32[5120]
-
blk.34.attn_k.weightQ4_K[5120 5120]
-
blk.34.attn_output.weightQ4_K[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightQ4_K[5120 5120]
-
blk.34.attn_v.biasF32[5120]
-
blk.34.attn_v.weightQ6_K[5120 5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ8_0[13696 5120]
-
blk.35.ffn_gate.weightQ4_K[5120 13696]
-
blk.35.ffn_up.weightQ4_K[5120 13696]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[5120]
-
blk.35.attn_k.weightQ4_K[5120 5120]
-
blk.35.attn_output.weightQ4_K[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightQ4_K[5120 5120]
-
blk.35.attn_v.biasF32[5120]
-
blk.35.attn_v.weightQ6_K[5120 5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ8_0[13696 5120]
-
blk.36.ffn_gate.weightQ4_K[5120 13696]
-
blk.36.ffn_up.weightQ4_K[5120 13696]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[5120]
-
blk.36.attn_k.weightQ4_K[5120 5120]
-
blk.36.attn_output.weightQ4_K[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightQ4_K[5120 5120]
-
blk.36.attn_v.biasF32[5120]
-
blk.36.attn_v.weightQ6_K[5120 5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ8_0[13696 5120]
-
blk.37.ffn_gate.weightQ4_K[5120 13696]
-
blk.37.ffn_up.weightQ4_K[5120 13696]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[5120]
-
blk.37.attn_k.weightQ4_K[5120 5120]
-
blk.37.attn_output.weightQ4_K[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightQ4_K[5120 5120]
-
blk.37.attn_v.biasF32[5120]
-
blk.37.attn_v.weightQ6_K[5120 5120]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ8_0[13696 5120]
-
blk.38.ffn_gate.weightQ4_K[5120 13696]
-
blk.38.ffn_up.weightQ4_K[5120 13696]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.biasF32[5120]
-
blk.38.attn_k.weightQ4_K[5120 5120]
-
blk.38.attn_output.weightQ4_K[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightQ4_K[5120 5120]
-
blk.38.attn_v.biasF32[5120]
-
blk.38.attn_v.weightQ6_K[5120 5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ8_0[13696 5120]
-
blk.39.ffn_gate.weightQ4_K[5120 13696]
-
blk.39.ffn_up.weightQ4_K[5120 13696]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[5120]
-
blk.39.attn_k.weightQ4_K[5120 5120]
-
blk.39.attn_output.weightQ4_K[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightQ4_K[5120 5120]
-
blk.39.attn_v.biasF32[5120]
-
blk.39.attn_v.weightQ6_K[5120 5120]
-
output.weightQ6_K[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39