latest
18GB
32B
Updated 2 days ago
f19896414f45 · 18GB
-
general.architectureqwen2
-
general.file_typeQ4_0
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count64
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length27392
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_0[5120 152064]
-
blk.0.ffn_gate.weightQ4_0[5120 27392]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightQ4_0[5120 1024]
-
blk.0.attn_output.weightQ4_0[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightQ4_0[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_0[5120 1024]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ4_0[27392 5120]
-
blk.0.ffn_up.weightQ4_0[5120 27392]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ4_0[27392 5120]
-
blk.1.ffn_gate.weightQ4_0[5120 27392]
-
blk.1.ffn_up.weightQ4_0[5120 27392]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightQ4_0[5120 1024]
-
blk.1.attn_output.weightQ4_0[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightQ4_0[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_0[5120 1024]
-
blk.2.ffn_gate.weightQ4_0[5120 27392]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightQ4_0[5120 1024]
-
blk.2.attn_output.weightQ4_0[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightQ4_0[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_0[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ4_0[27392 5120]
-
blk.2.ffn_up.weightQ4_0[5120 27392]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ4_0[27392 5120]
-
blk.3.ffn_gate.weightQ4_0[5120 27392]
-
blk.3.ffn_up.weightQ4_0[5120 27392]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightQ4_0[5120 1024]
-
blk.3.attn_output.weightQ4_0[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightQ4_0[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_0[5120 1024]
-
blk.4.ffn_gate.weightQ4_0[5120 27392]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightQ4_0[5120 1024]
-
blk.4.attn_output.weightQ4_0[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightQ4_0[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_0[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ4_0[27392 5120]
-
blk.4.ffn_up.weightQ4_0[5120 27392]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ4_0[27392 5120]
-
blk.5.ffn_gate.weightQ4_0[5120 27392]
-
blk.5.ffn_up.weightQ4_0[5120 27392]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightQ4_0[5120 1024]
-
blk.5.attn_output.weightQ4_0[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightQ4_0[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_0[5120 1024]
-
blk.6.ffn_gate.weightQ4_0[5120 27392]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightQ4_0[5120 1024]
-
blk.6.attn_output.weightQ4_0[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightQ4_0[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_0[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ4_0[27392 5120]
-
blk.6.ffn_up.weightQ4_0[5120 27392]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ4_0[27392 5120]
-
blk.7.ffn_gate.weightQ4_0[5120 27392]
-
blk.7.ffn_up.weightQ4_0[5120 27392]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightQ4_0[5120 1024]
-
blk.7.attn_output.weightQ4_0[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightQ4_0[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_0[5120 1024]
-
blk.8.ffn_gate.weightQ4_0[5120 27392]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightQ4_0[5120 1024]
-
blk.8.attn_output.weightQ4_0[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightQ4_0[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_0[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ4_0[27392 5120]
-
blk.8.ffn_up.weightQ4_0[5120 27392]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ4_0[27392 5120]
-
blk.9.ffn_gate.weightQ4_0[5120 27392]
-
blk.9.ffn_up.weightQ4_0[5120 27392]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightQ4_0[5120 1024]
-
blk.9.attn_output.weightQ4_0[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightQ4_0[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_0[5120 1024]
-
blk.10.ffn_gate.weightQ4_0[5120 27392]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightQ4_0[5120 1024]
-
blk.10.attn_output.weightQ4_0[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightQ4_0[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_0[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ4_0[27392 5120]
-
blk.10.ffn_up.weightQ4_0[5120 27392]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ4_0[27392 5120]
-
blk.11.ffn_gate.weightQ4_0[5120 27392]
-
blk.11.ffn_up.weightQ4_0[5120 27392]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightQ4_0[5120 1024]
-
blk.11.attn_output.weightQ4_0[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightQ4_0[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_0[5120 1024]
-
blk.12.ffn_gate.weightQ4_0[5120 27392]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightQ4_0[5120 1024]
-
blk.12.attn_output.weightQ4_0[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightQ4_0[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_0[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ4_0[27392 5120]
-
blk.12.ffn_up.weightQ4_0[5120 27392]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_0[27392 5120]
-
blk.13.ffn_gate.weightQ4_0[5120 27392]
-
blk.13.ffn_up.weightQ4_0[5120 27392]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightQ4_0[5120 1024]
-
blk.13.attn_output.weightQ4_0[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightQ4_0[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_0[5120 1024]
-
blk.14.ffn_gate.weightQ4_0[5120 27392]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightQ4_0[5120 1024]
-
blk.14.attn_output.weightQ4_0[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightQ4_0[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_0[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ4_0[27392 5120]
-
blk.14.ffn_up.weightQ4_0[5120 27392]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_0[27392 5120]
-
blk.15.ffn_gate.weightQ4_0[5120 27392]
-
blk.15.ffn_up.weightQ4_0[5120 27392]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightQ4_0[5120 1024]
-
blk.15.attn_output.weightQ4_0[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightQ4_0[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_0[5120 1024]
-
blk.16.ffn_gate.weightQ4_0[5120 27392]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightQ4_0[5120 1024]
-
blk.16.attn_output.weightQ4_0[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightQ4_0[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_0[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ4_0[27392 5120]
-
blk.16.ffn_up.weightQ4_0[5120 27392]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ4_0[27392 5120]
-
blk.17.ffn_gate.weightQ4_0[5120 27392]
-
blk.17.ffn_up.weightQ4_0[5120 27392]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightQ4_0[5120 1024]
-
blk.17.attn_output.weightQ4_0[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightQ4_0[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_0[5120 1024]
-
blk.18.ffn_gate.weightQ4_0[5120 27392]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightQ4_0[5120 1024]
-
blk.18.attn_output.weightQ4_0[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightQ4_0[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_0[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_0[27392 5120]
-
blk.18.ffn_up.weightQ4_0[5120 27392]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ4_0[27392 5120]
-
blk.19.ffn_gate.weightQ4_0[5120 27392]
-
blk.19.ffn_up.weightQ4_0[5120 27392]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightQ4_0[5120 1024]
-
blk.19.attn_output.weightQ4_0[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightQ4_0[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_0[5120 1024]
-
blk.20.ffn_gate.weightQ4_0[5120 27392]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightQ4_0[5120 1024]
-
blk.20.attn_output.weightQ4_0[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightQ4_0[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_0[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ4_0[27392 5120]
-
blk.20.ffn_up.weightQ4_0[5120 27392]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_0[27392 5120]
-
blk.21.ffn_gate.weightQ4_0[5120 27392]
-
blk.21.ffn_up.weightQ4_0[5120 27392]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightQ4_0[5120 1024]
-
blk.21.attn_output.weightQ4_0[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightQ4_0[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_0[5120 1024]
-
blk.22.ffn_gate.weightQ4_0[5120 27392]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightQ4_0[5120 1024]
-
blk.22.attn_output.weightQ4_0[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightQ4_0[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_0[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ4_0[27392 5120]
-
blk.22.ffn_up.weightQ4_0[5120 27392]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ4_0[27392 5120]
-
blk.23.ffn_gate.weightQ4_0[5120 27392]
-
blk.23.ffn_up.weightQ4_0[5120 27392]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightQ4_0[5120 1024]
-
blk.23.attn_output.weightQ4_0[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightQ4_0[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_0[5120 1024]
-
blk.24.ffn_gate.weightQ4_0[5120 27392]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightQ4_0[5120 1024]
-
blk.24.attn_output.weightQ4_0[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightQ4_0[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_0[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_0[27392 5120]
-
blk.24.ffn_up.weightQ4_0[5120 27392]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ4_0[27392 5120]
-
blk.25.ffn_gate.weightQ4_0[5120 27392]
-
blk.25.ffn_up.weightQ4_0[5120 27392]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightQ4_0[5120 1024]
-
blk.25.attn_output.weightQ4_0[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightQ4_0[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_0[5120 1024]
-
blk.26.ffn_gate.weightQ4_0[5120 27392]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightQ4_0[5120 1024]
-
blk.26.attn_output.weightQ4_0[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightQ4_0[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_0[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ4_0[27392 5120]
-
blk.26.ffn_up.weightQ4_0[5120 27392]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_0[27392 5120]
-
blk.27.ffn_gate.weightQ4_0[5120 27392]
-
blk.27.ffn_up.weightQ4_0[5120 27392]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightQ4_0[5120 1024]
-
blk.27.attn_output.weightQ4_0[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightQ4_0[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_0[5120 1024]
-
blk.28.ffn_gate.weightQ4_0[5120 27392]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightQ4_0[5120 1024]
-
blk.28.attn_output.weightQ4_0[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightQ4_0[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_0[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ4_0[27392 5120]
-
blk.28.ffn_up.weightQ4_0[5120 27392]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ4_0[27392 5120]
-
blk.29.ffn_gate.weightQ4_0[5120 27392]
-
blk.29.ffn_up.weightQ4_0[5120 27392]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightQ4_0[5120 1024]
-
blk.29.attn_output.weightQ4_0[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightQ4_0[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_0[5120 1024]
-
blk.30.ffn_gate.weightQ4_0[5120 27392]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightQ4_0[5120 1024]
-
blk.30.attn_output.weightQ4_0[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightQ4_0[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_0[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_0[27392 5120]
-
blk.30.ffn_up.weightQ4_0[5120 27392]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ4_0[27392 5120]
-
blk.31.ffn_gate.weightQ4_0[5120 27392]
-
blk.31.ffn_up.weightQ4_0[5120 27392]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightQ4_0[5120 1024]
-
blk.31.attn_output.weightQ4_0[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightQ4_0[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_0[5120 1024]
-
blk.32.ffn_gate.weightQ4_0[5120 27392]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightQ4_0[5120 1024]
-
blk.32.attn_output.weightQ4_0[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightQ4_0[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_0[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ4_0[27392 5120]
-
blk.32.ffn_up.weightQ4_0[5120 27392]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_0[27392 5120]
-
blk.33.ffn_gate.weightQ4_0[5120 27392]
-
blk.33.ffn_up.weightQ4_0[5120 27392]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightQ4_0[5120 1024]
-
blk.33.attn_output.weightQ4_0[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightQ4_0[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_0[5120 1024]
-
blk.34.ffn_gate.weightQ4_0[5120 27392]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightQ4_0[5120 1024]
-
blk.34.attn_output.weightQ4_0[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightQ4_0[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_0[5120 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ4_0[27392 5120]
-
blk.34.ffn_up.weightQ4_0[5120 27392]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ4_0[27392 5120]
-
blk.35.ffn_gate.weightQ4_0[5120 27392]
-
blk.35.ffn_up.weightQ4_0[5120 27392]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightQ4_0[5120 1024]
-
blk.35.attn_output.weightQ4_0[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightQ4_0[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_0[5120 1024]
-
blk.36.ffn_gate.weightQ4_0[5120 27392]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightQ4_0[5120 1024]
-
blk.36.attn_output.weightQ4_0[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightQ4_0[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_0[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ4_0[27392 5120]
-
blk.36.ffn_up.weightQ4_0[5120 27392]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ4_0[27392 5120]
-
blk.37.ffn_gate.weightQ4_0[5120 27392]
-
blk.37.ffn_up.weightQ4_0[5120 27392]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightQ4_0[5120 1024]
-
blk.37.attn_output.weightQ4_0[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightQ4_0[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_0[5120 1024]
-
blk.38.ffn_gate.weightQ4_0[5120 27392]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightQ4_0[5120 1024]
-
blk.38.attn_output.weightQ4_0[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightQ4_0[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_0[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ4_0[27392 5120]
-
blk.38.ffn_up.weightQ4_0[5120 27392]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ4_0[27392 5120]
-
blk.39.ffn_gate.weightQ4_0[5120 27392]
-
blk.39.ffn_up.weightQ4_0[5120 27392]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightQ4_0[5120 1024]
-
blk.39.attn_output.weightQ4_0[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightQ4_0[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_0[5120 1024]
-
blk.40.ffn_gate.weightQ4_0[5120 27392]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightQ4_0[5120 1024]
-
blk.40.attn_output.weightQ4_0[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightQ4_0[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_0[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightQ4_0[27392 5120]
-
blk.40.ffn_up.weightQ4_0[5120 27392]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightQ4_0[27392 5120]
-
blk.41.ffn_gate.weightQ4_0[5120 27392]
-
blk.41.ffn_up.weightQ4_0[5120 27392]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightQ4_0[5120 1024]
-
blk.41.attn_output.weightQ4_0[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightQ4_0[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_0[5120 1024]
-
blk.42.ffn_gate.weightQ4_0[5120 27392]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightQ4_0[5120 1024]
-
blk.42.attn_output.weightQ4_0[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightQ4_0[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_0[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightQ4_0[27392 5120]
-
blk.42.ffn_up.weightQ4_0[5120 27392]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightQ4_0[27392 5120]
-
blk.43.ffn_gate.weightQ4_0[5120 27392]
-
blk.43.ffn_up.weightQ4_0[5120 27392]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightQ4_0[5120 1024]
-
blk.43.attn_output.weightQ4_0[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightQ4_0[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_0[5120 1024]
-
blk.44.ffn_gate.weightQ4_0[5120 27392]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightQ4_0[5120 1024]
-
blk.44.attn_output.weightQ4_0[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightQ4_0[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_0[5120 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightQ4_0[27392 5120]
-
blk.44.ffn_up.weightQ4_0[5120 27392]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightQ4_0[27392 5120]
-
blk.45.ffn_gate.weightQ4_0[5120 27392]
-
blk.45.ffn_up.weightQ4_0[5120 27392]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightQ4_0[5120 1024]
-
blk.45.attn_output.weightQ4_0[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightQ4_0[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_0[5120 1024]
-
blk.46.ffn_gate.weightQ4_0[5120 27392]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightQ4_0[5120 1024]
-
blk.46.attn_output.weightQ4_0[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightQ4_0[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_0[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightQ4_0[27392 5120]
-
blk.46.ffn_up.weightQ4_0[5120 27392]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightQ4_0[27392 5120]
-
blk.47.ffn_gate.weightQ4_0[5120 27392]
-
blk.47.ffn_up.weightQ4_0[5120 27392]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightQ4_0[5120 1024]
-
blk.47.attn_output.weightQ4_0[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightQ4_0[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_0[5120 1024]
-
blk.48.ffn_gate.weightQ4_0[5120 27392]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightQ4_0[5120 1024]
-
blk.48.attn_output.weightQ4_0[5120 5120]
-
blk.48.attn_q.biasF32[5120]
-
blk.48.attn_q.weightQ4_0[5120 5120]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_0[5120 1024]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.ffn_down.weightQ4_0[27392 5120]
-
blk.48.ffn_up.weightQ4_0[5120 27392]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.ffn_down.weightQ4_0[27392 5120]
-
blk.49.ffn_gate.weightQ4_0[5120 27392]
-
blk.49.ffn_up.weightQ4_0[5120 27392]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightQ4_0[5120 1024]
-
blk.49.attn_output.weightQ4_0[5120 5120]
-
blk.49.attn_q.biasF32[5120]
-
blk.49.attn_q.weightQ4_0[5120 5120]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_0[5120 1024]
-
blk.50.ffn_gate.weightQ4_0[5120 27392]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightQ4_0[5120 1024]
-
blk.50.attn_output.weightQ4_0[5120 5120]
-
blk.50.attn_q.biasF32[5120]
-
blk.50.attn_q.weightQ4_0[5120 5120]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_0[5120 1024]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.ffn_down.weightQ4_0[27392 5120]
-
blk.50.ffn_up.weightQ4_0[5120 27392]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.ffn_down.weightQ4_0[27392 5120]
-
blk.51.ffn_gate.weightQ4_0[5120 27392]
-
blk.51.ffn_up.weightQ4_0[5120 27392]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightQ4_0[5120 1024]
-
blk.51.attn_output.weightQ4_0[5120 5120]
-
blk.51.attn_q.biasF32[5120]
-
blk.51.attn_q.weightQ4_0[5120 5120]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_0[5120 1024]
-
blk.52.ffn_gate.weightQ4_0[5120 27392]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightQ4_0[5120 1024]
-
blk.52.attn_output.weightQ4_0[5120 5120]
-
blk.52.attn_q.biasF32[5120]
-
blk.52.attn_q.weightQ4_0[5120 5120]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_0[5120 1024]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.ffn_down.weightQ4_0[27392 5120]
-
blk.52.ffn_up.weightQ4_0[5120 27392]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.ffn_down.weightQ4_0[27392 5120]
-
blk.53.ffn_gate.weightQ4_0[5120 27392]
-
blk.53.ffn_up.weightQ4_0[5120 27392]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightQ4_0[5120 1024]
-
blk.53.attn_output.weightQ4_0[5120 5120]
-
blk.53.attn_q.biasF32[5120]
-
blk.53.attn_q.weightQ4_0[5120 5120]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_0[5120 1024]
-
blk.54.ffn_gate.weightQ4_0[5120 27392]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightQ4_0[5120 1024]
-
blk.54.attn_output.weightQ4_0[5120 5120]
-
blk.54.attn_q.biasF32[5120]
-
blk.54.attn_q.weightQ4_0[5120 5120]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_0[5120 1024]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.ffn_down.weightQ4_0[27392 5120]
-
blk.54.ffn_up.weightQ4_0[5120 27392]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.ffn_down.weightQ4_0[27392 5120]
-
blk.55.ffn_gate.weightQ4_0[5120 27392]
-
blk.55.ffn_up.weightQ4_0[5120 27392]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightQ4_0[5120 1024]
-
blk.55.attn_output.weightQ4_0[5120 5120]
-
blk.55.attn_q.biasF32[5120]
-
blk.55.attn_q.weightQ4_0[5120 5120]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_0[5120 1024]
-
blk.56.ffn_gate.weightQ4_0[5120 27392]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightQ4_0[5120 1024]
-
blk.56.attn_output.weightQ4_0[5120 5120]
-
blk.56.attn_q.biasF32[5120]
-
blk.56.attn_q.weightQ4_0[5120 5120]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_0[5120 1024]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.ffn_down.weightQ4_0[27392 5120]
-
blk.56.ffn_up.weightQ4_0[5120 27392]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.ffn_down.weightQ4_0[27392 5120]
-
blk.57.ffn_gate.weightQ4_0[5120 27392]
-
blk.57.ffn_up.weightQ4_0[5120 27392]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightQ4_0[5120 1024]
-
blk.57.attn_output.weightQ4_0[5120 5120]
-
blk.57.attn_q.biasF32[5120]
-
blk.57.attn_q.weightQ4_0[5120 5120]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_0[5120 1024]
-
blk.58.ffn_gate.weightQ4_0[5120 27392]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightQ4_0[5120 1024]
-
blk.58.attn_output.weightQ4_0[5120 5120]
-
blk.58.attn_q.biasF32[5120]
-
blk.58.attn_q.weightQ4_0[5120 5120]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_0[5120 1024]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.ffn_down.weightQ4_0[27392 5120]
-
blk.58.ffn_up.weightQ4_0[5120 27392]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.ffn_down.weightQ4_0[27392 5120]
-
blk.59.ffn_gate.weightQ4_0[5120 27392]
-
blk.59.ffn_up.weightQ4_0[5120 27392]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightQ4_0[5120 1024]
-
blk.59.attn_output.weightQ4_0[5120 5120]
-
blk.59.attn_q.biasF32[5120]
-
blk.59.attn_q.weightQ4_0[5120 5120]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_0[5120 1024]
-
blk.60.ffn_gate.weightQ4_0[5120 27392]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightQ4_0[5120 1024]
-
blk.60.attn_output.weightQ4_0[5120 5120]
-
blk.60.attn_q.biasF32[5120]
-
blk.60.attn_q.weightQ4_0[5120 5120]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_0[5120 1024]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.ffn_down.weightQ4_0[27392 5120]
-
blk.60.ffn_up.weightQ4_0[5120 27392]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.ffn_down.weightQ4_0[27392 5120]
-
blk.61.ffn_gate.weightQ4_0[5120 27392]
-
blk.61.ffn_up.weightQ4_0[5120 27392]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightQ4_0[5120 1024]
-
blk.61.attn_output.weightQ4_0[5120 5120]
-
blk.61.attn_q.biasF32[5120]
-
blk.61.attn_q.weightQ4_0[5120 5120]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_0[5120 1024]
-
blk.62.ffn_gate.weightQ4_0[5120 27392]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightQ4_0[5120 1024]
-
blk.62.attn_output.weightQ4_0[5120 5120]
-
blk.62.attn_q.biasF32[5120]
-
blk.62.attn_q.weightQ4_0[5120 5120]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_0[5120 1024]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.ffn_down.weightQ4_0[27392 5120]
-
blk.62.ffn_up.weightQ4_0[5120 27392]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.ffn_down.weightQ4_0[27392 5120]
-
blk.63.ffn_gate.weightQ4_0[5120 27392]
-
blk.63.ffn_up.weightQ4_0[5120 27392]
-
blk.63.ffn_norm.weightF32[5120]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightQ4_0[5120 1024]
-
blk.63.attn_output.weightQ4_0[5120 5120]
-
blk.63.attn_q.biasF32[5120]
-
blk.63.attn_q.weightQ4_0[5120 5120]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_0[5120 1024]
-
output_norm.weightF32[5120]
-
output.weightQ6_K[5120 152064]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63