latest
41GB
72B
Updated 2 days ago
7bf41a59b4b0 · 41GB
-
general.architectureqwen2
-
general.file_typeQ4_0
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count80
-
qwen2.context_length32768
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_0[8192 152064]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_0[29568 8192]
-
blk.0.ffn_gate.weightQ4_0[8192 29568]
-
blk.0.ffn_up.weightQ4_0[8192 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightQ4_0[8192 1024]
-
blk.0.attn_output.weightQ4_0[8192 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weightQ4_0[8192 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_0[8192 1024]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightQ4_0[8192 1024]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weightQ4_0[8192 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_0[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_0[29568 8192]
-
blk.1.ffn_gate.weightQ4_0[8192 29568]
-
blk.1.ffn_up.weightQ4_0[8192 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightQ4_0[8192 1024]
-
blk.2.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weightQ4_0[8192 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_0[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_0[29568 8192]
-
blk.2.ffn_gate.weightQ4_0[8192 29568]
-
blk.2.ffn_up.weightQ4_0[8192 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightQ4_0[8192 1024]
-
blk.3.attn_output.weightQ4_0[8192 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weightQ4_0[8192 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_0[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_0[29568 8192]
-
blk.3.ffn_gate.weightQ4_0[8192 29568]
-
blk.3.ffn_up.weightQ4_0[8192 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightQ4_0[8192 1024]
-
blk.4.attn_output.weightQ4_0[8192 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weightQ4_0[8192 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_0[29568 8192]
-
blk.4.ffn_gate.weightQ4_0[8192 29568]
-
blk.4.ffn_up.weightQ4_0[8192 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightQ4_0[8192 1024]
-
blk.5.attn_output.weightQ4_0[8192 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weightQ4_0[8192 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_0[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_0[29568 8192]
-
blk.5.ffn_gate.weightQ4_0[8192 29568]
-
blk.5.ffn_up.weightQ4_0[8192 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightQ4_0[8192 1024]
-
blk.6.attn_output.weightQ4_0[8192 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weightQ4_0[8192 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_0[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_0[29568 8192]
-
blk.6.ffn_gate.weightQ4_0[8192 29568]
-
blk.6.ffn_up.weightQ4_0[8192 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightQ4_0[8192 1024]
-
blk.7.attn_output.weightQ4_0[8192 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weightQ4_0[8192 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_0[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_0[29568 8192]
-
blk.7.ffn_gate.weightQ4_0[8192 29568]
-
blk.7.ffn_up.weightQ4_0[8192 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightQ4_0[8192 1024]
-
blk.8.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weightQ4_0[8192 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_0[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_0[29568 8192]
-
blk.8.ffn_gate.weightQ4_0[8192 29568]
-
blk.8.ffn_up.weightQ4_0[8192 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightQ4_0[8192 1024]
-
blk.9.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weightQ4_0[8192 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_0[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_0[29568 8192]
-
blk.9.ffn_gate.weightQ4_0[8192 29568]
-
blk.9.ffn_up.weightQ4_0[8192 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightQ4_0[8192 1024]
-
blk.10.attn_output.weightQ4_0[8192 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weightQ4_0[8192 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_0[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_0[29568 8192]
-
blk.10.ffn_gate.weightQ4_0[8192 29568]
-
blk.10.ffn_up.weightQ4_0[8192 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightQ4_0[8192 1024]
-
blk.11.attn_output.weightQ4_0[8192 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weightQ4_0[8192 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_0[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_0[29568 8192]
-
blk.11.ffn_gate.weightQ4_0[8192 29568]
-
blk.11.ffn_up.weightQ4_0[8192 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightQ4_0[8192 1024]
-
blk.12.attn_output.weightQ4_0[8192 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weightQ4_0[8192 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_0[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_0[29568 8192]
-
blk.12.ffn_gate.weightQ4_0[8192 29568]
-
blk.12.ffn_up.weightQ4_0[8192 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightQ4_0[8192 1024]
-
blk.13.attn_output.weightQ4_0[8192 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weightQ4_0[8192 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_0[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_0[29568 8192]
-
blk.13.ffn_gate.weightQ4_0[8192 29568]
-
blk.13.ffn_up.weightQ4_0[8192 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightQ4_0[8192 1024]
-
blk.14.attn_output.weightQ4_0[8192 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weightQ4_0[8192 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_0[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_0[29568 8192]
-
blk.14.ffn_gate.weightQ4_0[8192 29568]
-
blk.14.ffn_up.weightQ4_0[8192 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightQ4_0[8192 1024]
-
blk.15.attn_output.weightQ4_0[8192 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weightQ4_0[8192 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_0[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_0[29568 8192]
-
blk.15.ffn_gate.weightQ4_0[8192 29568]
-
blk.15.ffn_up.weightQ4_0[8192 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightQ4_0[8192 1024]
-
blk.16.attn_output.weightQ4_0[8192 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weightQ4_0[8192 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_0[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_0[29568 8192]
-
blk.16.ffn_gate.weightQ4_0[8192 29568]
-
blk.16.ffn_up.weightQ4_0[8192 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightQ4_0[8192 1024]
-
blk.17.attn_output.weightQ4_0[8192 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weightQ4_0[8192 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_0[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_0[29568 8192]
-
blk.17.ffn_gate.weightQ4_0[8192 29568]
-
blk.17.ffn_up.weightQ4_0[8192 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightQ4_0[8192 1024]
-
blk.18.attn_output.weightQ4_0[8192 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weightQ4_0[8192 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_0[29568 8192]
-
blk.18.ffn_gate.weightQ4_0[8192 29568]
-
blk.18.ffn_up.weightQ4_0[8192 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightQ4_0[8192 1024]
-
blk.19.attn_output.weightQ4_0[8192 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weightQ4_0[8192 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_0[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_0[29568 8192]
-
blk.19.ffn_gate.weightQ4_0[8192 29568]
-
blk.19.ffn_up.weightQ4_0[8192 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightQ4_0[8192 1024]
-
blk.20.attn_output.weightQ4_0[8192 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weightQ4_0[8192 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_0[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_0[29568 8192]
-
blk.20.ffn_gate.weightQ4_0[8192 29568]
-
blk.20.ffn_up.weightQ4_0[8192 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightQ4_0[8192 1024]
-
blk.21.attn_output.weightQ4_0[8192 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weightQ4_0[8192 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_0[29568 8192]
-
blk.21.ffn_gate.weightQ4_0[8192 29568]
-
blk.21.ffn_up.weightQ4_0[8192 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightQ4_0[8192 1024]
-
blk.22.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weightQ4_0[8192 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_0[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_0[29568 8192]
-
blk.22.ffn_gate.weightQ4_0[8192 29568]
-
blk.22.ffn_up.weightQ4_0[8192 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightQ4_0[8192 1024]
-
blk.23.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weightQ4_0[8192 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_0[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_0[29568 8192]
-
blk.23.ffn_gate.weightQ4_0[8192 29568]
-
blk.23.ffn_up.weightQ4_0[8192 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightQ4_0[8192 1024]
-
blk.24.attn_output.weightQ4_0[8192 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weightQ4_0[8192 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_0[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_0[29568 8192]
-
blk.24.ffn_gate.weightQ4_0[8192 29568]
-
blk.24.ffn_up.weightQ4_0[8192 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightQ4_0[8192 1024]
-
blk.25.attn_output.weightQ4_0[8192 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weightQ4_0[8192 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_0[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_0[29568 8192]
-
blk.25.ffn_gate.weightQ4_0[8192 29568]
-
blk.25.ffn_up.weightQ4_0[8192 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightQ4_0[8192 1024]
-
blk.26.attn_output.weightQ4_0[8192 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weightQ4_0[8192 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_0[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_0[29568 8192]
-
blk.26.ffn_gate.weightQ4_0[8192 29568]
-
blk.26.ffn_up.weightQ4_0[8192 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightQ4_0[8192 1024]
-
blk.27.attn_output.weightQ4_0[8192 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weightQ4_0[8192 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_0[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_0[29568 8192]
-
blk.27.ffn_gate.weightQ4_0[8192 29568]
-
blk.27.ffn_up.weightQ4_0[8192 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightQ4_0[8192 1024]
-
blk.28.attn_output.weightQ4_0[8192 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weightQ4_0[8192 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_0[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_0[29568 8192]
-
blk.28.ffn_gate.weightQ4_0[8192 29568]
-
blk.28.ffn_up.weightQ4_0[8192 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightQ4_0[8192 1024]
-
blk.29.attn_output.weightQ4_0[8192 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weightQ4_0[8192 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_0[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_0[29568 8192]
-
blk.29.ffn_gate.weightQ4_0[8192 29568]
-
blk.29.ffn_up.weightQ4_0[8192 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightQ4_0[8192 1024]
-
blk.30.attn_output.weightQ4_0[8192 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weightQ4_0[8192 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_0[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_0[29568 8192]
-
blk.30.ffn_gate.weightQ4_0[8192 29568]
-
blk.30.ffn_up.weightQ4_0[8192 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightQ4_0[8192 1024]
-
blk.31.attn_output.weightQ4_0[8192 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weightQ4_0[8192 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_0[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_0[29568 8192]
-
blk.31.ffn_gate.weightQ4_0[8192 29568]
-
blk.31.ffn_up.weightQ4_0[8192 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightQ4_0[8192 1024]
-
blk.32.attn_output.weightQ4_0[8192 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weightQ4_0[8192 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_0[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_0[29568 8192]
-
blk.32.ffn_gate.weightQ4_0[8192 29568]
-
blk.32.ffn_up.weightQ4_0[8192 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightQ4_0[8192 1024]
-
blk.33.attn_output.weightQ4_0[8192 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weightQ4_0[8192 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_0[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_0[29568 8192]
-
blk.33.ffn_gate.weightQ4_0[8192 29568]
-
blk.33.ffn_up.weightQ4_0[8192 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightQ4_0[8192 1024]
-
blk.34.attn_output.weightQ4_0[8192 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weightQ4_0[8192 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_0[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_0[29568 8192]
-
blk.34.ffn_gate.weightQ4_0[8192 29568]
-
blk.34.ffn_up.weightQ4_0[8192 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightQ4_0[8192 1024]
-
blk.35.attn_output.weightQ4_0[8192 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weightQ4_0[8192 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_0[29568 8192]
-
blk.35.ffn_gate.weightQ4_0[8192 29568]
-
blk.35.ffn_up.weightQ4_0[8192 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightQ4_0[8192 1024]
-
blk.36.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weightQ4_0[8192 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_0[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_0[29568 8192]
-
blk.36.ffn_gate.weightQ4_0[8192 29568]
-
blk.36.ffn_up.weightQ4_0[8192 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightQ4_0[8192 1024]
-
blk.37.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weightQ4_0[8192 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_0[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_0[29568 8192]
-
blk.37.ffn_gate.weightQ4_0[8192 29568]
-
blk.37.ffn_up.weightQ4_0[8192 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightQ4_0[8192 1024]
-
blk.38.attn_output.weightQ4_0[8192 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weightQ4_0[8192 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_0[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_0[29568 8192]
-
blk.38.ffn_gate.weightQ4_0[8192 29568]
-
blk.38.ffn_up.weightQ4_0[8192 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightQ4_0[8192 1024]
-
blk.39.attn_output.weightQ4_0[8192 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weightQ4_0[8192 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_0[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_0[29568 8192]
-
blk.39.ffn_gate.weightQ4_0[8192 29568]
-
blk.39.ffn_up.weightQ4_0[8192 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightQ4_0[8192 1024]
-
blk.40.attn_output.weightQ4_0[8192 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weightQ4_0[8192 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_0[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_0[29568 8192]
-
blk.40.ffn_gate.weightQ4_0[8192 29568]
-
blk.40.ffn_up.weightQ4_0[8192 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightQ4_0[8192 1024]
-
blk.41.attn_output.weightQ4_0[8192 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weightQ4_0[8192 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_0[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_0[29568 8192]
-
blk.41.ffn_gate.weightQ4_0[8192 29568]
-
blk.41.ffn_up.weightQ4_0[8192 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightQ4_0[8192 1024]
-
blk.42.attn_output.weightQ4_0[8192 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weightQ4_0[8192 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_0[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_0[29568 8192]
-
blk.42.ffn_gate.weightQ4_0[8192 29568]
-
blk.42.ffn_up.weightQ4_0[8192 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightQ4_0[8192 1024]
-
blk.43.attn_output.weightQ4_0[8192 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weightQ4_0[8192 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_0[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_0[29568 8192]
-
blk.43.ffn_gate.weightQ4_0[8192 29568]
-
blk.43.ffn_up.weightQ4_0[8192 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightQ4_0[8192 1024]
-
blk.44.attn_output.weightQ4_0[8192 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weightQ4_0[8192 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_0[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_0[29568 8192]
-
blk.44.ffn_gate.weightQ4_0[8192 29568]
-
blk.44.ffn_up.weightQ4_0[8192 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightQ4_0[8192 1024]
-
blk.45.attn_output.weightQ4_0[8192 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weightQ4_0[8192 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_0[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_0[29568 8192]
-
blk.45.ffn_gate.weightQ4_0[8192 29568]
-
blk.45.ffn_up.weightQ4_0[8192 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightQ4_0[8192 1024]
-
blk.46.attn_output.weightQ4_0[8192 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weightQ4_0[8192 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_0[29568 8192]
-
blk.46.ffn_gate.weightQ4_0[8192 29568]
-
blk.46.ffn_up.weightQ4_0[8192 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightQ4_0[8192 1024]
-
blk.47.attn_output.weightQ4_0[8192 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weightQ4_0[8192 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_0[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_0[29568 8192]
-
blk.47.ffn_gate.weightQ4_0[8192 29568]
-
blk.47.ffn_up.weightQ4_0[8192 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightQ4_0[8192 1024]
-
blk.48.attn_output.weightQ4_0[8192 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weightQ4_0[8192 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_0[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ4_0[29568 8192]
-
blk.48.ffn_gate.weightQ4_0[8192 29568]
-
blk.48.ffn_up.weightQ4_0[8192 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightQ4_0[8192 1024]
-
blk.49.attn_output.weightQ4_0[8192 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weightQ4_0[8192 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_0[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ4_0[29568 8192]
-
blk.49.ffn_gate.weightQ4_0[8192 29568]
-
blk.49.ffn_up.weightQ4_0[8192 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightQ4_0[8192 1024]
-
blk.50.attn_output.weightQ4_0[8192 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weightQ4_0[8192 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_0[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightQ4_0[29568 8192]
-
blk.50.ffn_gate.weightQ4_0[8192 29568]
-
blk.50.ffn_up.weightQ4_0[8192 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightQ4_0[8192 1024]
-
blk.51.attn_output.weightQ4_0[8192 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weightQ4_0[8192 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_0[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ4_0[29568 8192]
-
blk.51.ffn_gate.weightQ4_0[8192 29568]
-
blk.51.ffn_up.weightQ4_0[8192 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightQ4_0[8192 1024]
-
blk.52.attn_output.weightQ4_0[8192 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weightQ4_0[8192 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_0[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ4_0[29568 8192]
-
blk.52.ffn_gate.weightQ4_0[8192 29568]
-
blk.52.ffn_up.weightQ4_0[8192 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightQ4_0[8192 1024]
-
blk.53.attn_output.weightQ4_0[8192 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weightQ4_0[8192 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_0[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightQ4_0[29568 8192]
-
blk.53.ffn_gate.weightQ4_0[8192 29568]
-
blk.53.ffn_up.weightQ4_0[8192 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightQ4_0[8192 1024]
-
blk.54.attn_output.weightQ4_0[8192 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weightQ4_0[8192 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_0[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ4_0[29568 8192]
-
blk.54.ffn_gate.weightQ4_0[8192 29568]
-
blk.54.ffn_up.weightQ4_0[8192 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightQ4_0[8192 1024]
-
blk.55.attn_output.weightQ4_0[8192 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weightQ4_0[8192 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_0[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ4_0[29568 8192]
-
blk.55.ffn_gate.weightQ4_0[8192 29568]
-
blk.55.ffn_up.weightQ4_0[8192 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightQ4_0[8192 1024]
-
blk.56.attn_output.weightQ4_0[8192 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weightQ4_0[8192 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_0[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightQ4_0[29568 8192]
-
blk.56.ffn_gate.weightQ4_0[8192 29568]
-
blk.56.ffn_up.weightQ4_0[8192 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightQ4_0[8192 1024]
-
blk.57.attn_output.weightQ4_0[8192 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weightQ4_0[8192 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_0[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightQ4_0[29568 8192]
-
blk.57.ffn_gate.weightQ4_0[8192 29568]
-
blk.57.ffn_up.weightQ4_0[8192 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightQ4_0[8192 1024]
-
blk.58.attn_output.weightQ4_0[8192 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weightQ4_0[8192 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_0[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ4_0[29568 8192]
-
blk.58.ffn_gate.weightQ4_0[8192 29568]
-
blk.58.ffn_up.weightQ4_0[8192 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightQ4_0[8192 1024]
-
blk.59.attn_output.weightQ4_0[8192 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weightQ4_0[8192 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_0[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightQ4_0[29568 8192]
-
blk.59.ffn_gate.weightQ4_0[8192 29568]
-
blk.59.ffn_up.weightQ4_0[8192 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightQ4_0[8192 1024]
-
blk.60.attn_output.weightQ4_0[8192 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weightQ4_0[8192 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_0[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ4_0[29568 8192]
-
blk.60.ffn_gate.weightQ4_0[8192 29568]
-
blk.60.ffn_up.weightQ4_0[8192 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightQ4_0[8192 1024]
-
blk.61.attn_output.weightQ4_0[8192 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weightQ4_0[8192 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_0[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ4_0[29568 8192]
-
blk.61.ffn_gate.weightQ4_0[8192 29568]
-
blk.61.ffn_up.weightQ4_0[8192 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightQ4_0[8192 1024]
-
blk.62.attn_output.weightQ4_0[8192 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weightQ4_0[8192 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_0[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ4_0[29568 8192]
-
blk.62.ffn_gate.weightQ4_0[8192 29568]
-
blk.62.ffn_up.weightQ4_0[8192 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightQ4_0[8192 1024]
-
blk.63.attn_output.weightQ4_0[8192 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weightQ4_0[8192 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_0[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ4_0[29568 8192]
-
blk.63.ffn_gate.weightQ4_0[8192 29568]
-
blk.63.ffn_up.weightQ4_0[8192 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weightQ4_0[8192 1024]
-
blk.64.attn_output.weightQ4_0[8192 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weightQ4_0[8192 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ4_0[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ4_0[29568 8192]
-
blk.64.ffn_gate.weightQ4_0[8192 29568]
-
blk.64.ffn_up.weightQ4_0[8192 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weightQ4_0[8192 1024]
-
blk.65.attn_output.weightQ4_0[8192 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weightQ4_0[8192 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ4_0[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ4_0[29568 8192]
-
blk.65.ffn_gate.weightQ4_0[8192 29568]
-
blk.65.ffn_up.weightQ4_0[8192 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weightQ4_0[8192 1024]
-
blk.66.attn_output.weightQ4_0[8192 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weightQ4_0[8192 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ4_0[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ4_0[29568 8192]
-
blk.66.ffn_gate.weightQ4_0[8192 29568]
-
blk.66.ffn_up.weightQ4_0[8192 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weightQ4_0[8192 1024]
-
blk.67.attn_output.weightQ4_0[8192 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weightQ4_0[8192 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ4_0[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ4_0[29568 8192]
-
blk.67.ffn_gate.weightQ4_0[8192 29568]
-
blk.67.ffn_up.weightQ4_0[8192 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weightQ4_0[8192 1024]
-
blk.68.attn_output.weightQ4_0[8192 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weightQ4_0[8192 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ4_0[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightQ4_0[29568 8192]
-
blk.68.ffn_gate.weightQ4_0[8192 29568]
-
blk.68.ffn_up.weightQ4_0[8192 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weightQ4_0[8192 1024]
-
blk.69.attn_output.weightQ4_0[8192 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weightQ4_0[8192 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ4_0[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ4_0[29568 8192]
-
blk.69.ffn_gate.weightQ4_0[8192 29568]
-
blk.69.ffn_up.weightQ4_0[8192 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weightQ4_0[8192 1024]
-
blk.70.attn_output.weightQ4_0[8192 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weightQ4_0[8192 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ4_0[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ4_0[29568 8192]
-
blk.70.ffn_gate.weightQ4_0[8192 29568]
-
blk.70.ffn_up.weightQ4_0[8192 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weightQ4_0[8192 1024]
-
blk.71.attn_output.weightQ4_0[8192 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weightQ4_0[8192 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ4_0[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ4_0[29568 8192]
-
blk.71.ffn_gate.weightQ4_0[8192 29568]
-
blk.71.ffn_up.weightQ4_0[8192 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weightQ4_0[8192 1024]
-
blk.72.attn_output.weightQ4_0[8192 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weightQ4_0[8192 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ4_0[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ4_0[29568 8192]
-
blk.72.ffn_gate.weightQ4_0[8192 29568]
-
blk.72.ffn_up.weightQ4_0[8192 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weightQ4_0[8192 1024]
-
blk.73.attn_output.weightQ4_0[8192 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weightQ4_0[8192 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ4_0[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ4_0[29568 8192]
-
blk.73.ffn_gate.weightQ4_0[8192 29568]
-
blk.73.ffn_up.weightQ4_0[8192 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weightQ4_0[8192 1024]
-
blk.74.attn_output.weightQ4_0[8192 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weightQ4_0[8192 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ4_0[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ4_0[29568 8192]
-
blk.74.ffn_gate.weightQ4_0[8192 29568]
-
blk.74.ffn_up.weightQ4_0[8192 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weightQ4_0[8192 1024]
-
blk.75.attn_output.weightQ4_0[8192 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weightQ4_0[8192 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ4_0[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ4_0[29568 8192]
-
blk.75.ffn_gate.weightQ4_0[8192 29568]
-
blk.75.ffn_up.weightQ4_0[8192 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weightQ4_0[8192 1024]
-
blk.76.attn_output.weightQ4_0[8192 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weightQ4_0[8192 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ4_0[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ4_0[29568 8192]
-
blk.76.ffn_gate.weightQ4_0[8192 29568]
-
blk.76.ffn_up.weightQ4_0[8192 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weightQ4_0[8192 1024]
-
blk.77.attn_output.weightQ4_0[8192 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weightQ4_0[8192 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ4_0[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ4_0[29568 8192]
-
blk.77.ffn_gate.weightQ4_0[8192 29568]
-
blk.77.ffn_up.weightQ4_0[8192 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weightQ4_0[8192 1024]
-
blk.78.attn_output.weightQ4_0[8192 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weightQ4_0[8192 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ4_0[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightQ4_0[29568 8192]
-
blk.78.ffn_gate.weightQ4_0[8192 29568]
-
blk.78.ffn_up.weightQ4_0[8192 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weightQ4_0[8192 1024]
-
blk.79.attn_output.weightQ4_0[8192 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weightQ4_0[8192 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ4_0[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ4_0[29568 8192]
-
blk.79.ffn_gate.weightQ4_0[8192 29568]
-
blk.79.ffn_up.weightQ4_0[8192 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
output.weightQ6_K[8192 152064]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79