latest
8.2GB
61 Pulls Updated 5 months ago
de0334402b97 · 8.2GB
-
general.architectureqwen2
-
general.file_typeQ4_0
-
general.quantization_version2
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv40
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count40
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length13696
-
qwen2.use_parallel_residualtrue
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151643
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_0[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ4_0[13696 5120]
-
blk.0.ffn_gate.weightQ4_0[5120 13696]
-
blk.0.ffn_up.weightQ4_0[5120 13696]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[5120]
-
blk.0.attn_k.weightQ4_0[5120 5120]
-
blk.0.attn_output.weightQ4_0[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightQ4_0[5120 5120]
-
blk.0.attn_v.biasF32[5120]
-
blk.0.attn_v.weightQ4_0[5120 5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ4_0[13696 5120]
-
blk.1.ffn_gate.weightQ4_0[5120 13696]
-
blk.1.ffn_up.weightQ4_0[5120 13696]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[5120]
-
blk.1.attn_k.weightQ4_0[5120 5120]
-
blk.1.attn_output.weightQ4_0[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightQ4_0[5120 5120]
-
blk.1.attn_v.biasF32[5120]
-
blk.1.attn_v.weightQ4_0[5120 5120]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ4_0[13696 5120]
-
blk.2.ffn_gate.weightQ4_0[5120 13696]
-
blk.2.ffn_up.weightQ4_0[5120 13696]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.biasF32[5120]
-
blk.2.attn_k.weightQ4_0[5120 5120]
-
blk.2.attn_output.weightQ4_0[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightQ4_0[5120 5120]
-
blk.2.attn_v.biasF32[5120]
-
blk.2.attn_v.weightQ4_0[5120 5120]
-
blk.3.ffn_gate.weightQ4_0[5120 13696]
-
blk.3.ffn_up.weightQ4_0[5120 13696]
-
blk.3.attn_k.biasF32[5120]
-
blk.3.attn_k.weightQ4_0[5120 5120]
-
blk.3.attn_output.weightQ4_0[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightQ4_0[5120 5120]
-
blk.3.attn_v.biasF32[5120]
-
blk.3.attn_v.weightQ4_0[5120 5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ4_0[13696 5120]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ4_0[13696 5120]
-
blk.4.ffn_gate.weightQ4_0[5120 13696]
-
blk.4.ffn_up.weightQ4_0[5120 13696]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[5120]
-
blk.4.attn_k.weightQ4_0[5120 5120]
-
blk.4.attn_output.weightQ4_0[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightQ4_0[5120 5120]
-
blk.4.attn_v.biasF32[5120]
-
blk.4.attn_v.weightQ4_0[5120 5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ4_0[13696 5120]
-
blk.5.ffn_gate.weightQ4_0[5120 13696]
-
blk.5.ffn_up.weightQ4_0[5120 13696]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[5120]
-
blk.5.attn_k.weightQ4_0[5120 5120]
-
blk.5.attn_output.weightQ4_0[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightQ4_0[5120 5120]
-
blk.5.attn_v.biasF32[5120]
-
blk.5.attn_v.weightQ4_0[5120 5120]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ4_0[13696 5120]
-
blk.6.ffn_gate.weightQ4_0[5120 13696]
-
blk.6.ffn_up.weightQ4_0[5120 13696]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.biasF32[5120]
-
blk.6.attn_k.weightQ4_0[5120 5120]
-
blk.6.attn_output.weightQ4_0[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightQ4_0[5120 5120]
-
blk.6.attn_v.biasF32[5120]
-
blk.6.attn_v.weightQ4_0[5120 5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ4_0[13696 5120]
-
blk.7.ffn_gate.weightQ4_0[5120 13696]
-
blk.7.ffn_up.weightQ4_0[5120 13696]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[5120]
-
blk.7.attn_k.weightQ4_0[5120 5120]
-
blk.7.attn_output.weightQ4_0[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightQ4_0[5120 5120]
-
blk.7.attn_v.biasF32[5120]
-
blk.7.attn_v.weightQ4_0[5120 5120]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ4_0[13696 5120]
-
blk.8.ffn_gate.weightQ4_0[5120 13696]
-
blk.8.ffn_up.weightQ4_0[5120 13696]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.biasF32[5120]
-
blk.8.attn_k.weightQ4_0[5120 5120]
-
blk.8.attn_output.weightQ4_0[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightQ4_0[5120 5120]
-
blk.8.attn_v.biasF32[5120]
-
blk.8.attn_v.weightQ4_0[5120 5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ4_0[13696 5120]
-
blk.9.ffn_gate.weightQ4_0[5120 13696]
-
blk.9.ffn_up.weightQ4_0[5120 13696]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[5120]
-
blk.9.attn_k.weightQ4_0[5120 5120]
-
blk.9.attn_output.weightQ4_0[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightQ4_0[5120 5120]
-
blk.9.attn_v.biasF32[5120]
-
blk.9.attn_v.weightQ4_0[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightQ4_0[5120 5120]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ4_0[13696 5120]
-
blk.10.ffn_gate.weightQ4_0[5120 13696]
-
blk.10.ffn_up.weightQ4_0[5120 13696]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.biasF32[5120]
-
blk.10.attn_k.weightQ4_0[5120 5120]
-
blk.10.attn_output.weightQ4_0[5120 5120]
-
blk.10.attn_v.biasF32[5120]
-
blk.10.attn_v.weightQ4_0[5120 5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ4_0[13696 5120]
-
blk.11.ffn_gate.weightQ4_0[5120 13696]
-
blk.11.ffn_up.weightQ4_0[5120 13696]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[5120]
-
blk.11.attn_k.weightQ4_0[5120 5120]
-
blk.11.attn_output.weightQ4_0[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightQ4_0[5120 5120]
-
blk.11.attn_v.biasF32[5120]
-
blk.11.attn_v.weightQ4_0[5120 5120]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ4_0[13696 5120]
-
blk.12.ffn_gate.weightQ4_0[5120 13696]
-
blk.12.ffn_up.weightQ4_0[5120 13696]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[5120]
-
blk.12.attn_k.weightQ4_0[5120 5120]
-
blk.12.attn_output.weightQ4_0[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightQ4_0[5120 5120]
-
blk.12.attn_v.biasF32[5120]
-
blk.12.attn_v.weightQ4_0[5120 5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_0[13696 5120]
-
blk.13.ffn_gate.weightQ4_0[5120 13696]
-
blk.13.ffn_up.weightQ4_0[5120 13696]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[5120]
-
blk.13.attn_k.weightQ4_0[5120 5120]
-
blk.13.attn_output.weightQ4_0[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightQ4_0[5120 5120]
-
blk.13.attn_v.biasF32[5120]
-
blk.13.attn_v.weightQ4_0[5120 5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ4_0[13696 5120]
-
blk.14.ffn_gate.weightQ4_0[5120 13696]
-
blk.14.ffn_up.weightQ4_0[5120 13696]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.biasF32[5120]
-
blk.14.attn_k.weightQ4_0[5120 5120]
-
blk.14.attn_output.weightQ4_0[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightQ4_0[5120 5120]
-
blk.14.attn_v.biasF32[5120]
-
blk.14.attn_v.weightQ4_0[5120 5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_0[13696 5120]
-
blk.15.ffn_gate.weightQ4_0[5120 13696]
-
blk.15.ffn_up.weightQ4_0[5120 13696]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[5120]
-
blk.15.attn_k.weightQ4_0[5120 5120]
-
blk.15.attn_output.weightQ4_0[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightQ4_0[5120 5120]
-
blk.15.attn_v.biasF32[5120]
-
blk.15.attn_v.weightQ4_0[5120 5120]
-
blk.16.attn_k.biasF32[5120]
-
blk.16.attn_k.weightQ4_0[5120 5120]
-
blk.16.attn_output.weightQ4_0[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightQ4_0[5120 5120]
-
blk.16.attn_v.biasF32[5120]
-
blk.16.attn_v.weightQ4_0[5120 5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ4_0[13696 5120]
-
blk.16.ffn_gate.weightQ4_0[5120 13696]
-
blk.16.ffn_up.weightQ4_0[5120 13696]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ4_0[13696 5120]
-
blk.17.ffn_gate.weightQ4_0[5120 13696]
-
blk.17.ffn_up.weightQ4_0[5120 13696]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[5120]
-
blk.17.attn_k.weightQ4_0[5120 5120]
-
blk.17.attn_output.weightQ4_0[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightQ4_0[5120 5120]
-
blk.17.attn_v.biasF32[5120]
-
blk.17.attn_v.weightQ4_0[5120 5120]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_0[13696 5120]
-
blk.18.ffn_gate.weightQ4_0[5120 13696]
-
blk.18.ffn_up.weightQ4_0[5120 13696]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.biasF32[5120]
-
blk.18.attn_k.weightQ4_0[5120 5120]
-
blk.18.attn_output.weightQ4_0[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightQ4_0[5120 5120]
-
blk.18.attn_v.biasF32[5120]
-
blk.18.attn_v.weightQ4_0[5120 5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ4_0[13696 5120]
-
blk.19.ffn_gate.weightQ4_0[5120 13696]
-
blk.19.ffn_up.weightQ4_0[5120 13696]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[5120]
-
blk.19.attn_k.weightQ4_0[5120 5120]
-
blk.19.attn_output.weightQ4_0[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightQ4_0[5120 5120]
-
blk.19.attn_v.biasF32[5120]
-
blk.19.attn_v.weightQ4_0[5120 5120]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ4_0[13696 5120]
-
blk.20.ffn_gate.weightQ4_0[5120 13696]
-
blk.20.ffn_up.weightQ4_0[5120 13696]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[5120]
-
blk.20.attn_k.weightQ4_0[5120 5120]
-
blk.20.attn_output.weightQ4_0[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightQ4_0[5120 5120]
-
blk.20.attn_v.biasF32[5120]
-
blk.20.attn_v.weightQ4_0[5120 5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_0[13696 5120]
-
blk.21.ffn_gate.weightQ4_0[5120 13696]
-
blk.21.ffn_up.weightQ4_0[5120 13696]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[5120]
-
blk.21.attn_k.weightQ4_0[5120 5120]
-
blk.21.attn_output.weightQ4_0[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightQ4_0[5120 5120]
-
blk.21.attn_v.biasF32[5120]
-
blk.21.attn_v.weightQ4_0[5120 5120]
-
blk.22.ffn_gate.weightQ4_0[5120 13696]
-
blk.22.attn_k.biasF32[5120]
-
blk.22.attn_k.weightQ4_0[5120 5120]
-
blk.22.attn_output.weightQ4_0[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightQ4_0[5120 5120]
-
blk.22.attn_v.biasF32[5120]
-
blk.22.attn_v.weightQ4_0[5120 5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ4_0[13696 5120]
-
blk.22.ffn_up.weightQ4_0[5120 13696]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ4_0[13696 5120]
-
blk.23.ffn_gate.weightQ4_0[5120 13696]
-
blk.23.ffn_up.weightQ4_0[5120 13696]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[5120]
-
blk.23.attn_k.weightQ4_0[5120 5120]
-
blk.23.attn_output.weightQ4_0[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightQ4_0[5120 5120]
-
blk.23.attn_v.biasF32[5120]
-
blk.23.attn_v.weightQ4_0[5120 5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_0[13696 5120]
-
blk.24.ffn_gate.weightQ4_0[5120 13696]
-
blk.24.ffn_up.weightQ4_0[5120 13696]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[5120]
-
blk.24.attn_k.weightQ4_0[5120 5120]
-
blk.24.attn_output.weightQ4_0[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightQ4_0[5120 5120]
-
blk.24.attn_v.biasF32[5120]
-
blk.24.attn_v.weightQ4_0[5120 5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ4_0[13696 5120]
-
blk.25.ffn_gate.weightQ4_0[5120 13696]
-
blk.25.ffn_up.weightQ4_0[5120 13696]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[5120]
-
blk.25.attn_k.weightQ4_0[5120 5120]
-
blk.25.attn_output.weightQ4_0[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightQ4_0[5120 5120]
-
blk.25.attn_v.biasF32[5120]
-
blk.25.attn_v.weightQ4_0[5120 5120]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ4_0[13696 5120]
-
blk.26.ffn_gate.weightQ4_0[5120 13696]
-
blk.26.ffn_up.weightQ4_0[5120 13696]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.biasF32[5120]
-
blk.26.attn_k.weightQ4_0[5120 5120]
-
blk.26.attn_output.weightQ4_0[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightQ4_0[5120 5120]
-
blk.26.attn_v.biasF32[5120]
-
blk.26.attn_v.weightQ4_0[5120 5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_0[13696 5120]
-
blk.27.ffn_gate.weightQ4_0[5120 13696]
-
blk.27.ffn_up.weightQ4_0[5120 13696]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[5120]
-
blk.27.attn_k.weightQ4_0[5120 5120]
-
blk.27.attn_output.weightQ4_0[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightQ4_0[5120 5120]
-
blk.27.attn_v.biasF32[5120]
-
blk.27.attn_v.weightQ4_0[5120 5120]
-
blk.28.ffn_gate.weightQ4_0[5120 13696]
-
blk.28.ffn_up.weightQ4_0[5120 13696]
-
blk.28.attn_k.biasF32[5120]
-
blk.28.attn_k.weightQ4_0[5120 5120]
-
blk.28.attn_output.weightQ4_0[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightQ4_0[5120 5120]
-
blk.28.attn_v.biasF32[5120]
-
blk.28.attn_v.weightQ4_0[5120 5120]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ4_0[13696 5120]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ4_0[13696 5120]
-
blk.29.ffn_gate.weightQ4_0[5120 13696]
-
blk.29.ffn_up.weightQ4_0[5120 13696]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[5120]
-
blk.29.attn_k.weightQ4_0[5120 5120]
-
blk.29.attn_output.weightQ4_0[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightQ4_0[5120 5120]
-
blk.29.attn_v.biasF32[5120]
-
blk.29.attn_v.weightQ4_0[5120 5120]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_0[13696 5120]
-
blk.30.ffn_gate.weightQ4_0[5120 13696]
-
blk.30.ffn_up.weightQ4_0[5120 13696]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.biasF32[5120]
-
blk.30.attn_k.weightQ4_0[5120 5120]
-
blk.30.attn_output.weightQ4_0[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightQ4_0[5120 5120]
-
blk.30.attn_v.biasF32[5120]
-
blk.30.attn_v.weightQ4_0[5120 5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ4_0[13696 5120]
-
blk.31.ffn_gate.weightQ4_0[5120 13696]
-
blk.31.ffn_up.weightQ4_0[5120 13696]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[5120]
-
blk.31.attn_k.weightQ4_0[5120 5120]
-
blk.31.attn_output.weightQ4_0[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightQ4_0[5120 5120]
-
blk.31.attn_v.biasF32[5120]
-
blk.31.attn_v.weightQ4_0[5120 5120]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ4_0[13696 5120]
-
blk.32.ffn_gate.weightQ4_0[5120 13696]
-
blk.32.ffn_up.weightQ4_0[5120 13696]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[5120]
-
blk.32.attn_k.weightQ4_0[5120 5120]
-
blk.32.attn_output.weightQ4_0[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightQ4_0[5120 5120]
-
blk.32.attn_v.biasF32[5120]
-
blk.32.attn_v.weightQ4_0[5120 5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_0[13696 5120]
-
blk.33.ffn_gate.weightQ4_0[5120 13696]
-
blk.33.ffn_up.weightQ4_0[5120 13696]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[5120]
-
blk.33.attn_k.weightQ4_0[5120 5120]
-
blk.33.attn_output.weightQ4_0[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightQ4_0[5120 5120]
-
blk.33.attn_v.biasF32[5120]
-
blk.33.attn_v.weightQ4_0[5120 5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ4_0[13696 5120]
-
blk.34.ffn_gate.weightQ4_0[5120 13696]
-
blk.34.ffn_up.weightQ4_0[5120 13696]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.biasF32[5120]
-
blk.34.attn_k.weightQ4_0[5120 5120]
-
blk.34.attn_output.weightQ4_0[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightQ4_0[5120 5120]
-
blk.34.attn_v.biasF32[5120]
-
blk.34.attn_v.weightQ4_0[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightQ4_0[5120 5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ4_0[13696 5120]
-
blk.35.ffn_gate.weightQ4_0[5120 13696]
-
blk.35.ffn_up.weightQ4_0[5120 13696]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[5120]
-
blk.35.attn_k.weightQ4_0[5120 5120]
-
blk.35.attn_output.weightQ4_0[5120 5120]
-
blk.35.attn_v.biasF32[5120]
-
blk.35.attn_v.weightQ4_0[5120 5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ4_0[13696 5120]
-
blk.36.ffn_gate.weightQ4_0[5120 13696]
-
blk.36.ffn_up.weightQ4_0[5120 13696]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[5120]
-
blk.36.attn_k.weightQ4_0[5120 5120]
-
blk.36.attn_output.weightQ4_0[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightQ4_0[5120 5120]
-
blk.36.attn_v.biasF32[5120]
-
blk.36.attn_v.weightQ4_0[5120 5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ4_0[13696 5120]
-
blk.37.ffn_gate.weightQ4_0[5120 13696]
-
blk.37.ffn_up.weightQ4_0[5120 13696]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[5120]
-
blk.37.attn_k.weightQ4_0[5120 5120]
-
blk.37.attn_output.weightQ4_0[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightQ4_0[5120 5120]
-
blk.37.attn_v.biasF32[5120]
-
blk.37.attn_v.weightQ4_0[5120 5120]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ4_0[13696 5120]
-
blk.38.ffn_gate.weightQ4_0[5120 13696]
-
blk.38.ffn_up.weightQ4_0[5120 13696]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.biasF32[5120]
-
blk.38.attn_k.weightQ4_0[5120 5120]
-
blk.38.attn_output.weightQ4_0[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightQ4_0[5120 5120]
-
blk.38.attn_v.biasF32[5120]
-
blk.38.attn_v.weightQ4_0[5120 5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ4_0[13696 5120]
-
blk.39.ffn_gate.weightQ4_0[5120 13696]
-
blk.39.ffn_up.weightQ4_0[5120 13696]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[5120]
-
blk.39.attn_k.weightQ4_0[5120 5120]
-
blk.39.attn_output.weightQ4_0[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightQ4_0[5120 5120]
-
blk.39.attn_v.biasF32[5120]
-
blk.39.attn_v.weightQ4_0[5120 5120]
-
output_norm.weightF32[5120]
-
output.weightQ6_K[5120 152064]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39