latest
12GB
32B
113 Pulls Updated 5 months ago
d2e35984c923 · 12GB
-
general.architectureqwen2
-
general.file_typeQ2_K
-
general.quantization_version2
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count64
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length27392
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ2_K[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ3_K[27392 5120]
-
blk.0.ffn_gate.weightQ2_K[5120 27392]
-
blk.0.ffn_up.weightQ2_K[5120 27392]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightQ2_K[5120 1024]
-
blk.0.attn_output.weightQ3_K[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightQ2_K[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ3_K[27392 5120]
-
blk.1.ffn_gate.weightQ2_K[5120 27392]
-
blk.1.ffn_up.weightQ2_K[5120 27392]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightQ2_K[5120 1024]
-
blk.1.attn_output.weightQ3_K[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightQ2_K[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ3_K[27392 5120]
-
blk.2.ffn_gate.weightQ2_K[5120 27392]
-
blk.2.ffn_up.weightQ2_K[5120 27392]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightQ2_K[5120 1024]
-
blk.2.attn_output.weightQ3_K[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightQ2_K[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[5120 1024]
-
blk.3.ffn_gate.weightQ2_K[5120 27392]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightQ2_K[5120 1024]
-
blk.3.attn_output.weightQ3_K[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightQ2_K[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ3_K[27392 5120]
-
blk.3.ffn_up.weightQ2_K[5120 27392]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ3_K[27392 5120]
-
blk.4.ffn_gate.weightQ2_K[5120 27392]
-
blk.4.ffn_up.weightQ2_K[5120 27392]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightQ2_K[5120 1024]
-
blk.4.attn_output.weightQ3_K[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightQ2_K[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ3_K[27392 5120]
-
blk.5.ffn_gate.weightQ2_K[5120 27392]
-
blk.5.ffn_up.weightQ2_K[5120 27392]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightQ2_K[5120 1024]
-
blk.5.attn_output.weightQ3_K[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightQ2_K[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ3_K[27392 5120]
-
blk.6.ffn_gate.weightQ2_K[5120 27392]
-
blk.6.ffn_up.weightQ2_K[5120 27392]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightQ2_K[5120 1024]
-
blk.6.attn_output.weightQ3_K[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightQ2_K[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[5120 1024]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ3_K[27392 5120]
-
blk.7.ffn_gate.weightQ2_K[5120 27392]
-
blk.7.ffn_up.weightQ2_K[5120 27392]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightQ2_K[5120 1024]
-
blk.7.attn_output.weightQ3_K[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightQ2_K[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[5120 1024]
-
blk.8.ffn_gate.weightQ2_K[5120 27392]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightQ2_K[5120 1024]
-
blk.8.attn_output.weightQ3_K[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightQ2_K[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ3_K[27392 5120]
-
blk.8.ffn_up.weightQ2_K[5120 27392]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ3_K[27392 5120]
-
blk.9.ffn_gate.weightQ2_K[5120 27392]
-
blk.9.ffn_up.weightQ2_K[5120 27392]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightQ2_K[5120 1024]
-
blk.9.attn_output.weightQ3_K[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightQ2_K[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ3_K[27392 5120]
-
blk.10.ffn_gate.weightQ2_K[5120 27392]
-
blk.10.ffn_up.weightQ2_K[5120 27392]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightQ2_K[5120 1024]
-
blk.10.attn_output.weightQ3_K[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightQ2_K[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ3_K[27392 5120]
-
blk.11.ffn_gate.weightQ2_K[5120 27392]
-
blk.11.ffn_up.weightQ2_K[5120 27392]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightQ2_K[5120 1024]
-
blk.11.attn_output.weightQ3_K[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightQ2_K[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ3_K[27392 5120]
-
blk.12.ffn_gate.weightQ2_K[5120 27392]
-
blk.12.ffn_up.weightQ2_K[5120 27392]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightQ2_K[5120 1024]
-
blk.12.attn_output.weightQ3_K[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightQ2_K[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[5120 1024]
-
blk.13.ffn_gate.weightQ2_K[5120 27392]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightQ2_K[5120 1024]
-
blk.13.attn_output.weightQ3_K[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightQ2_K[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ3_K[27392 5120]
-
blk.13.ffn_up.weightQ2_K[5120 27392]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ3_K[27392 5120]
-
blk.14.ffn_gate.weightQ2_K[5120 27392]
-
blk.14.ffn_up.weightQ2_K[5120 27392]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightQ2_K[5120 1024]
-
blk.14.attn_output.weightQ3_K[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightQ2_K[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ3_K[27392 5120]
-
blk.15.ffn_gate.weightQ2_K[5120 27392]
-
blk.15.ffn_up.weightQ2_K[5120 27392]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightQ2_K[5120 1024]
-
blk.15.attn_output.weightQ3_K[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightQ2_K[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ3_K[27392 5120]
-
blk.16.ffn_gate.weightQ2_K[5120 27392]
-
blk.16.ffn_up.weightQ2_K[5120 27392]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightQ2_K[5120 1024]
-
blk.16.attn_output.weightQ3_K[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightQ2_K[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ3_K[27392 5120]
-
blk.17.ffn_gate.weightQ2_K[5120 27392]
-
blk.17.ffn_up.weightQ2_K[5120 27392]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightQ2_K[5120 1024]
-
blk.17.attn_output.weightQ3_K[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightQ2_K[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[5120 1024]
-
blk.18.ffn_gate.weightQ2_K[5120 27392]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightQ2_K[5120 1024]
-
blk.18.attn_output.weightQ3_K[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightQ2_K[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ3_K[27392 5120]
-
blk.18.ffn_up.weightQ2_K[5120 27392]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ3_K[27392 5120]
-
blk.19.ffn_gate.weightQ2_K[5120 27392]
-
blk.19.ffn_up.weightQ2_K[5120 27392]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightQ2_K[5120 1024]
-
blk.19.attn_output.weightQ3_K[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightQ2_K[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ3_K[27392 5120]
-
blk.20.ffn_gate.weightQ2_K[5120 27392]
-
blk.20.ffn_up.weightQ2_K[5120 27392]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightQ2_K[5120 1024]
-
blk.20.attn_output.weightQ3_K[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightQ2_K[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ3_K[27392 5120]
-
blk.21.ffn_gate.weightQ2_K[5120 27392]
-
blk.21.ffn_up.weightQ2_K[5120 27392]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightQ2_K[5120 1024]
-
blk.21.attn_output.weightQ3_K[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightQ2_K[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ3_K[27392 5120]
-
blk.22.ffn_gate.weightQ2_K[5120 27392]
-
blk.22.ffn_up.weightQ2_K[5120 27392]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightQ2_K[5120 1024]
-
blk.22.attn_output.weightQ3_K[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightQ2_K[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[5120 1024]
-
blk.23.ffn_gate.weightQ2_K[5120 27392]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightQ2_K[5120 1024]
-
blk.23.attn_output.weightQ3_K[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightQ2_K[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ3_K[27392 5120]
-
blk.23.ffn_up.weightQ2_K[5120 27392]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ3_K[27392 5120]
-
blk.24.ffn_gate.weightQ2_K[5120 27392]
-
blk.24.ffn_up.weightQ2_K[5120 27392]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightQ2_K[5120 1024]
-
blk.24.attn_output.weightQ3_K[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightQ2_K[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[5120 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ3_K[27392 5120]
-
blk.25.ffn_gate.weightQ2_K[5120 27392]
-
blk.25.ffn_up.weightQ2_K[5120 27392]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightQ2_K[5120 1024]
-
blk.25.attn_output.weightQ3_K[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightQ2_K[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ3_K[27392 5120]
-
blk.26.ffn_gate.weightQ2_K[5120 27392]
-
blk.26.ffn_up.weightQ2_K[5120 27392]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightQ2_K[5120 1024]
-
blk.26.attn_output.weightQ3_K[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightQ2_K[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ3_K[27392 5120]
-
blk.27.ffn_gate.weightQ2_K[5120 27392]
-
blk.27.ffn_up.weightQ2_K[5120 27392]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightQ2_K[5120 1024]
-
blk.27.attn_output.weightQ3_K[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightQ2_K[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[5120 1024]
-
blk.28.ffn_gate.weightQ2_K[5120 27392]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightQ2_K[5120 1024]
-
blk.28.attn_output.weightQ3_K[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightQ2_K[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ3_K[27392 5120]
-
blk.28.ffn_up.weightQ2_K[5120 27392]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ3_K[27392 5120]
-
blk.29.ffn_gate.weightQ2_K[5120 27392]
-
blk.29.ffn_up.weightQ2_K[5120 27392]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightQ2_K[5120 1024]
-
blk.29.attn_output.weightQ3_K[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightQ2_K[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ3_K[27392 5120]
-
blk.30.ffn_gate.weightQ2_K[5120 27392]
-
blk.30.ffn_up.weightQ2_K[5120 27392]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightQ2_K[5120 1024]
-
blk.30.attn_output.weightQ3_K[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightQ2_K[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ3_K[27392 5120]
-
blk.31.ffn_gate.weightQ2_K[5120 27392]
-
blk.31.ffn_up.weightQ2_K[5120 27392]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightQ2_K[5120 1024]
-
blk.31.attn_output.weightQ3_K[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightQ2_K[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ3_K[27392 5120]
-
blk.32.ffn_gate.weightQ2_K[5120 27392]
-
blk.32.ffn_up.weightQ2_K[5120 27392]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightQ2_K[5120 1024]
-
blk.32.attn_output.weightQ3_K[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightQ2_K[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[5120 1024]
-
blk.33.ffn_gate.weightQ2_K[5120 27392]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightQ2_K[5120 1024]
-
blk.33.attn_output.weightQ3_K[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightQ2_K[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ3_K[27392 5120]
-
blk.33.ffn_up.weightQ2_K[5120 27392]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ3_K[27392 5120]
-
blk.34.ffn_gate.weightQ2_K[5120 27392]
-
blk.34.ffn_up.weightQ2_K[5120 27392]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightQ2_K[5120 1024]
-
blk.34.attn_output.weightQ3_K[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightQ2_K[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ3_K[27392 5120]
-
blk.35.ffn_gate.weightQ2_K[5120 27392]
-
blk.35.ffn_up.weightQ2_K[5120 27392]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightQ2_K[5120 1024]
-
blk.35.attn_output.weightQ3_K[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightQ2_K[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ3_K[27392 5120]
-
blk.36.ffn_gate.weightQ2_K[5120 27392]
-
blk.36.ffn_up.weightQ2_K[5120 27392]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightQ2_K[5120 1024]
-
blk.36.attn_output.weightQ3_K[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightQ2_K[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ3_K[27392 5120]
-
blk.37.ffn_gate.weightQ2_K[5120 27392]
-
blk.37.ffn_up.weightQ2_K[5120 27392]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightQ2_K[5120 1024]
-
blk.37.attn_output.weightQ3_K[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightQ2_K[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[5120 1024]
-
blk.38.ffn_gate.weightQ2_K[5120 27392]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightQ2_K[5120 1024]
-
blk.38.attn_output.weightQ3_K[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightQ2_K[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ3_K[27392 5120]
-
blk.38.ffn_up.weightQ2_K[5120 27392]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ3_K[27392 5120]
-
blk.39.ffn_gate.weightQ2_K[5120 27392]
-
blk.39.ffn_up.weightQ2_K[5120 27392]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightQ2_K[5120 1024]
-
blk.39.attn_output.weightQ3_K[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightQ2_K[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightQ3_K[27392 5120]
-
blk.40.ffn_gate.weightQ2_K[5120 27392]
-
blk.40.ffn_up.weightQ2_K[5120 27392]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightQ2_K[5120 1024]
-
blk.40.attn_output.weightQ3_K[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightQ2_K[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[5120 1024]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightQ3_K[27392 5120]
-
blk.41.ffn_gate.weightQ2_K[5120 27392]
-
blk.41.ffn_up.weightQ2_K[5120 27392]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightQ2_K[5120 1024]
-
blk.41.attn_output.weightQ3_K[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightQ2_K[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightQ3_K[27392 5120]
-
blk.42.ffn_gate.weightQ2_K[5120 27392]
-
blk.42.ffn_up.weightQ2_K[5120 27392]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightQ2_K[5120 1024]
-
blk.42.attn_output.weightQ3_K[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightQ2_K[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[5120 1024]
-
blk.43.ffn_gate.weightQ2_K[5120 27392]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightQ2_K[5120 1024]
-
blk.43.attn_output.weightQ3_K[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightQ2_K[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[5120 1024]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightQ3_K[27392 5120]
-
blk.43.ffn_up.weightQ2_K[5120 27392]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightQ3_K[27392 5120]
-
blk.44.ffn_gate.weightQ2_K[5120 27392]
-
blk.44.ffn_up.weightQ2_K[5120 27392]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightQ2_K[5120 1024]
-
blk.44.attn_output.weightQ3_K[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightQ2_K[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[5120 1024]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightQ3_K[27392 5120]
-
blk.45.ffn_gate.weightQ2_K[5120 27392]
-
blk.45.ffn_up.weightQ2_K[5120 27392]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightQ2_K[5120 1024]
-
blk.45.attn_output.weightQ3_K[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightQ2_K[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightQ3_K[27392 5120]
-
blk.46.ffn_gate.weightQ2_K[5120 27392]
-
blk.46.ffn_up.weightQ2_K[5120 27392]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightQ2_K[5120 1024]
-
blk.46.attn_output.weightQ3_K[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightQ2_K[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[5120 1024]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightQ3_K[27392 5120]
-
blk.47.ffn_gate.weightQ2_K[5120 27392]
-
blk.47.ffn_up.weightQ2_K[5120 27392]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightQ2_K[5120 1024]
-
blk.47.attn_output.weightQ3_K[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightQ2_K[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[5120 1024]
-
blk.48.ffn_gate.weightQ2_K[5120 27392]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightQ2_K[5120 1024]
-
blk.48.attn_output.weightQ3_K[5120 5120]
-
blk.48.attn_q.biasF32[5120]
-
blk.48.attn_q.weightQ2_K[5120 5120]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_K[5120 1024]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.ffn_down.weightQ3_K[27392 5120]
-
blk.48.ffn_up.weightQ2_K[5120 27392]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.ffn_down.weightQ3_K[27392 5120]
-
blk.49.ffn_gate.weightQ2_K[5120 27392]
-
blk.49.ffn_up.weightQ2_K[5120 27392]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightQ2_K[5120 1024]
-
blk.49.attn_output.weightQ3_K[5120 5120]
-
blk.49.attn_q.biasF32[5120]
-
blk.49.attn_q.weightQ2_K[5120 5120]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_K[5120 1024]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.ffn_down.weightQ3_K[27392 5120]
-
blk.50.ffn_gate.weightQ2_K[5120 27392]
-
blk.50.ffn_up.weightQ2_K[5120 27392]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightQ2_K[5120 1024]
-
blk.50.attn_output.weightQ3_K[5120 5120]
-
blk.50.attn_q.biasF32[5120]
-
blk.50.attn_q.weightQ2_K[5120 5120]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_K[5120 1024]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.ffn_down.weightQ3_K[27392 5120]
-
blk.51.ffn_gate.weightQ2_K[5120 27392]
-
blk.51.ffn_up.weightQ2_K[5120 27392]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightQ2_K[5120 1024]
-
blk.51.attn_output.weightQ3_K[5120 5120]
-
blk.51.attn_q.biasF32[5120]
-
blk.51.attn_q.weightQ2_K[5120 5120]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_K[5120 1024]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.ffn_down.weightQ3_K[27392 5120]
-
blk.52.ffn_gate.weightQ2_K[5120 27392]
-
blk.52.ffn_up.weightQ2_K[5120 27392]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightQ2_K[5120 1024]
-
blk.52.attn_output.weightQ3_K[5120 5120]
-
blk.52.attn_q.biasF32[5120]
-
blk.52.attn_q.weightQ2_K[5120 5120]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_K[5120 1024]
-
blk.53.ffn_gate.weightQ2_K[5120 27392]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightQ2_K[5120 1024]
-
blk.53.attn_output.weightQ3_K[5120 5120]
-
blk.53.attn_q.biasF32[5120]
-
blk.53.attn_q.weightQ2_K[5120 5120]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_K[5120 1024]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.ffn_down.weightQ3_K[27392 5120]
-
blk.53.ffn_up.weightQ2_K[5120 27392]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.ffn_down.weightQ3_K[27392 5120]
-
blk.54.ffn_gate.weightQ2_K[5120 27392]
-
blk.54.ffn_up.weightQ2_K[5120 27392]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightQ2_K[5120 1024]
-
blk.54.attn_output.weightQ3_K[5120 5120]
-
blk.54.attn_q.biasF32[5120]
-
blk.54.attn_q.weightQ2_K[5120 5120]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_K[5120 1024]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.ffn_down.weightQ3_K[27392 5120]
-
blk.55.ffn_gate.weightQ2_K[5120 27392]
-
blk.55.ffn_up.weightQ2_K[5120 27392]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightQ2_K[5120 1024]
-
blk.55.attn_output.weightQ3_K[5120 5120]
-
blk.55.attn_q.biasF32[5120]
-
blk.55.attn_q.weightQ2_K[5120 5120]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_K[5120 1024]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.ffn_down.weightQ3_K[27392 5120]
-
blk.56.ffn_gate.weightQ2_K[5120 27392]
-
blk.56.ffn_up.weightQ2_K[5120 27392]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightQ2_K[5120 1024]
-
blk.56.attn_output.weightQ3_K[5120 5120]
-
blk.56.attn_q.biasF32[5120]
-
blk.56.attn_q.weightQ2_K[5120 5120]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_K[5120 1024]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.ffn_down.weightQ3_K[27392 5120]
-
blk.57.ffn_gate.weightQ2_K[5120 27392]
-
blk.57.ffn_up.weightQ2_K[5120 27392]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightQ2_K[5120 1024]
-
blk.57.attn_output.weightQ3_K[5120 5120]
-
blk.57.attn_q.biasF32[5120]
-
blk.57.attn_q.weightQ2_K[5120 5120]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_K[5120 1024]
-
blk.58.ffn_gate.weightQ2_K[5120 27392]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightQ2_K[5120 1024]
-
blk.58.attn_output.weightQ3_K[5120 5120]
-
blk.58.attn_q.biasF32[5120]
-
blk.58.attn_q.weightQ2_K[5120 5120]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_K[5120 1024]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.ffn_down.weightQ3_K[27392 5120]
-
blk.58.ffn_up.weightQ2_K[5120 27392]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.ffn_down.weightQ3_K[27392 5120]
-
blk.59.ffn_gate.weightQ2_K[5120 27392]
-
blk.59.ffn_up.weightQ2_K[5120 27392]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightQ2_K[5120 1024]
-
blk.59.attn_output.weightQ3_K[5120 5120]
-
blk.59.attn_q.biasF32[5120]
-
blk.59.attn_q.weightQ2_K[5120 5120]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_K[5120 1024]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.ffn_down.weightQ3_K[27392 5120]
-
blk.60.ffn_gate.weightQ2_K[5120 27392]
-
blk.60.ffn_up.weightQ2_K[5120 27392]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightQ2_K[5120 1024]
-
blk.60.attn_output.weightQ3_K[5120 5120]
-
blk.60.attn_q.biasF32[5120]
-
blk.60.attn_q.weightQ2_K[5120 5120]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_K[5120 1024]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.ffn_down.weightQ3_K[27392 5120]
-
blk.61.ffn_gate.weightQ2_K[5120 27392]
-
blk.61.ffn_up.weightQ2_K[5120 27392]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightQ2_K[5120 1024]
-
blk.61.attn_output.weightQ3_K[5120 5120]
-
blk.61.attn_q.biasF32[5120]
-
blk.61.attn_q.weightQ2_K[5120 5120]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_K[5120 1024]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.ffn_down.weightQ3_K[27392 5120]
-
blk.62.ffn_gate.weightQ2_K[5120 27392]
-
blk.62.ffn_up.weightQ2_K[5120 27392]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightQ2_K[5120 1024]
-
blk.62.attn_output.weightQ3_K[5120 5120]
-
blk.62.attn_q.biasF32[5120]
-
blk.62.attn_q.weightQ2_K[5120 5120]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_K[5120 1024]
-
blk.63.ffn_gate.weightQ2_K[5120 27392]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightQ2_K[5120 1024]
-
blk.63.attn_output.weightQ3_K[5120 5120]
-
blk.63.attn_q.biasF32[5120]
-
blk.63.attn_q.weightQ2_K[5120 5120]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_K[5120 1024]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.ffn_down.weightQ3_K[27392 5120]
-
blk.63.ffn_up.weightQ2_K[5120 27392]
-
blk.63.ffn_norm.weightF32[5120]
-
output.weightQ6_K[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63