An experimental model for my own personal uses.
Tools
8B
9B
171 Pulls Updated 7 weeks ago
e84ed7399c82 · 5.5GB
-
general.architecturegemma2
-
general.file_typeQ4_0
-
gemma2.attention.head_count16
-
gemma2.attention.head_count_kv8
-
gemma2.attention.key_length256
-
gemma2.attention.layer_norm_rms_epsilon1e-06
-
gemma2.attention.value_length256
-
gemma2.block_count42
-
gemma2.context_length8192
-
gemma2.embedding_length3584
-
gemma2.feed_forward_length14336
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_padding_tokenfalse
-
tokenizer.ggml.add_unknown_tokenfalse
-
tokenizer.ggml.bos_token_id2
-
tokenizer.ggml.eos_token_id1
-
tokenizer.ggml.eot_token_id107
-
tokenizer.ggml.merges[ ...]
-
tokenizer.ggml.middle_token_id68
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.predefault
-
tokenizer.ggml.prefix_token_id67
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.suffix_token_id69
-
tokenizer.ggml.token_type[3 3 3 2 1 ...]
-
tokenizer.ggml.tokens[<pad> <eos> <bos> <unk> <mask> ...]
-
tokenizer.ggml.unknown_token_id3
-
NameTypeShape
-
token_embd.weightQ6_K[3584 256000]
-
blk.0.attn_norm.weightF32[3584]
-
blk.0.ffn_down.weightQ4_0[14336 3584]
-
blk.0.ffn_gate.weightQ4_0[3584 14336]
-
blk.0.ffn_up.weightQ4_0[3584 14336]
-
blk.0.post_attention_norm.weightF32[3584]
-
blk.0.post_ffw_norm.weightF32[3584]
-
blk.0.ffn_norm.weightF32[3584]
-
blk.0.attn_k.weightQ4_0[3584 2048]
-
blk.0.attn_output.weightQ4_0[4096 3584]
-
blk.0.attn_q.weightQ4_0[3584 4096]
-
blk.0.attn_v.weightQ4_0[3584 2048]
-
blk.1.attn_norm.weightF32[3584]
-
blk.1.ffn_down.weightQ4_0[14336 3584]
-
blk.1.ffn_gate.weightQ4_0[3584 14336]
-
blk.1.ffn_up.weightQ4_0[3584 14336]
-
blk.1.post_attention_norm.weightF32[3584]
-
blk.1.post_ffw_norm.weightF32[3584]
-
blk.1.ffn_norm.weightF32[3584]
-
blk.1.attn_k.weightQ4_0[3584 2048]
-
blk.1.attn_output.weightQ4_0[4096 3584]
-
blk.1.attn_q.weightQ4_0[3584 4096]
-
blk.1.attn_v.weightQ4_0[3584 2048]
-
blk.2.attn_v.weightQ4_0[3584 2048]
-
blk.2.ffn_down.weightQ4_0[14336 3584]
-
blk.2.ffn_gate.weightQ4_0[3584 14336]
-
blk.2.ffn_up.weightQ4_0[3584 14336]
-
blk.2.post_attention_norm.weightF32[3584]
-
blk.2.post_ffw_norm.weightF32[3584]
-
blk.2.ffn_norm.weightF32[3584]
-
blk.2.attn_k.weightQ4_0[3584 2048]
-
blk.2.attn_output.weightQ4_0[4096 3584]
-
blk.2.attn_q.weightQ4_0[3584 4096]
-
blk.2.attn_norm.weightF32[3584]
-
blk.3.attn_v.weightQ4_0[3584 2048]
-
blk.3.ffn_down.weightQ4_0[14336 3584]
-
blk.3.ffn_gate.weightQ4_0[3584 14336]
-
blk.3.ffn_up.weightQ4_0[3584 14336]
-
blk.3.post_attention_norm.weightF32[3584]
-
blk.3.post_ffw_norm.weightF32[3584]
-
blk.3.ffn_norm.weightF32[3584]
-
blk.3.attn_k.weightQ4_0[3584 2048]
-
blk.3.attn_output.weightQ4_0[4096 3584]
-
blk.3.attn_q.weightQ4_0[3584 4096]
-
blk.3.attn_norm.weightF32[3584]
-
blk.4.ffn_norm.weightF32[3584]
-
blk.4.ffn_down.weightQ4_0[14336 3584]
-
blk.4.ffn_gate.weightQ4_0[3584 14336]
-
blk.4.ffn_up.weightQ4_0[3584 14336]
-
blk.4.post_attention_norm.weightF32[3584]
-
blk.4.post_ffw_norm.weightF32[3584]
-
blk.4.attn_norm.weightF32[3584]
-
blk.4.attn_k.weightQ4_0[3584 2048]
-
blk.4.attn_output.weightQ4_0[4096 3584]
-
blk.4.attn_q.weightQ4_0[3584 4096]
-
blk.4.attn_v.weightQ4_0[3584 2048]
-
blk.5.attn_norm.weightF32[3584]
-
blk.5.ffn_down.weightQ4_0[14336 3584]
-
blk.5.ffn_gate.weightQ4_0[3584 14336]
-
blk.5.ffn_up.weightQ4_0[3584 14336]
-
blk.5.post_attention_norm.weightF32[3584]
-
blk.5.post_ffw_norm.weightF32[3584]
-
blk.5.ffn_norm.weightF32[3584]
-
blk.5.attn_k.weightQ4_0[3584 2048]
-
blk.5.attn_output.weightQ4_0[4096 3584]
-
blk.5.attn_q.weightQ4_0[3584 4096]
-
blk.5.attn_v.weightQ4_0[3584 2048]
-
blk.6.attn_norm.weightF32[3584]
-
blk.6.ffn_down.weightQ4_0[14336 3584]
-
blk.6.ffn_gate.weightQ4_0[3584 14336]
-
blk.6.ffn_up.weightQ4_0[3584 14336]
-
blk.6.post_attention_norm.weightF32[3584]
-
blk.6.post_ffw_norm.weightF32[3584]
-
blk.6.ffn_norm.weightF32[3584]
-
blk.6.attn_k.weightQ4_0[3584 2048]
-
blk.6.attn_output.weightQ4_0[4096 3584]
-
blk.6.attn_q.weightQ4_0[3584 4096]
-
blk.6.attn_v.weightQ4_0[3584 2048]
-
blk.7.attn_norm.weightF32[3584]
-
blk.7.ffn_up.weightQ4_0[3584 14336]
-
blk.7.attn_k.weightQ4_0[3584 2048]
-
blk.7.attn_output.weightQ4_0[4096 3584]
-
blk.7.attn_q.weightQ4_0[3584 4096]
-
blk.7.attn_v.weightQ4_0[3584 2048]
-
blk.7.ffn_gate.weightQ4_0[3584 14336]
-
blk.7.ffn_down.weightQ4_0[14336 3584]
-
blk.7.post_attention_norm.weightF32[3584]
-
blk.7.post_ffw_norm.weightF32[3584]
-
blk.7.ffn_norm.weightF32[3584]
-
blk.8.attn_norm.weightF32[3584]
-
blk.8.ffn_down.weightQ4_0[14336 3584]
-
blk.8.ffn_gate.weightQ4_0[3584 14336]
-
blk.8.ffn_up.weightQ4_0[3584 14336]
-
blk.8.post_ffw_norm.weightF32[3584]
-
blk.8.ffn_norm.weightF32[3584]
-
blk.8.attn_k.weightQ4_0[3584 2048]
-
blk.8.attn_output.weightQ4_0[4096 3584]
-
blk.8.attn_q.weightQ4_0[3584 4096]
-
blk.8.attn_v.weightQ4_0[3584 2048]
-
blk.8.post_attention_norm.weightF32[3584]
-
blk.9.attn_v.weightQ4_0[3584 2048]
-
blk.9.ffn_down.weightQ4_0[14336 3584]
-
blk.9.attn_norm.weightF32[3584]
-
blk.9.ffn_gate.weightQ4_0[3584 14336]
-
blk.9.ffn_up.weightQ4_0[3584 14336]
-
blk.9.post_attention_norm.weightF32[3584]
-
blk.9.post_ffw_norm.weightF32[3584]
-
blk.9.ffn_norm.weightF32[3584]
-
blk.9.attn_k.weightQ4_0[3584 2048]
-
blk.9.attn_output.weightQ4_0[4096 3584]
-
blk.9.attn_q.weightQ4_0[3584 4096]
-
blk.10.attn_q.weightQ4_0[3584 4096]
-
blk.10.attn_v.weightQ4_0[3584 2048]
-
blk.10.ffn_down.weightQ4_0[14336 3584]
-
blk.10.ffn_gate.weightQ4_0[3584 14336]
-
blk.10.attn_k.weightQ4_0[3584 2048]
-
blk.10.ffn_norm.weightF32[3584]
-
blk.10.ffn_up.weightQ4_0[3584 14336]
-
blk.10.post_attention_norm.weightF32[3584]
-
blk.10.post_ffw_norm.weightF32[3584]
-
blk.10.attn_output.weightQ4_0[4096 3584]
-
blk.10.attn_norm.weightF32[3584]
-
blk.11.ffn_norm.weightF32[3584]
-
blk.11.post_attention_norm.weightF32[3584]
-
blk.11.attn_q.weightQ4_0[3584 4096]
-
blk.11.ffn_up.weightQ4_0[3584 14336]
-
blk.11.attn_k.weightQ4_0[3584 2048]
-
blk.11.attn_norm.weightF32[3584]
-
blk.11.post_ffw_norm.weightF32[3584]
-
blk.11.attn_output.weightQ4_0[4096 3584]
-
blk.11.attn_v.weightQ4_0[3584 2048]
-
blk.11.ffn_down.weightQ4_0[14336 3584]
-
blk.11.ffn_gate.weightQ4_0[3584 14336]
-
blk.12.attn_norm.weightF32[3584]
-
blk.12.ffn_down.weightQ4_0[14336 3584]
-
blk.12.attn_v.weightQ4_0[3584 2048]
-
blk.12.attn_q.weightQ4_0[3584 4096]
-
blk.12.attn_output.weightQ4_0[4096 3584]
-
blk.12.attn_k.weightQ4_0[3584 2048]
-
blk.12.ffn_norm.weightF32[3584]
-
blk.12.post_ffw_norm.weightF32[3584]
-
blk.12.post_attention_norm.weightF32[3584]
-
blk.12.ffn_up.weightQ4_0[3584 14336]
-
blk.12.ffn_gate.weightQ4_0[3584 14336]
-
blk.13.attn_output.weightQ4_0[4096 3584]
-
blk.13.attn_v.weightQ4_0[3584 2048]
-
blk.13.ffn_norm.weightF32[3584]
-
blk.13.post_ffw_norm.weightF32[3584]
-
blk.13.post_attention_norm.weightF32[3584]
-
blk.13.ffn_up.weightQ4_0[3584 14336]
-
blk.13.ffn_gate.weightQ4_0[3584 14336]
-
blk.13.ffn_down.weightQ4_0[14336 3584]
-
blk.13.attn_norm.weightF32[3584]
-
blk.13.attn_k.weightQ4_0[3584 2048]
-
blk.13.attn_q.weightQ4_0[3584 4096]
-
blk.14.post_ffw_norm.weightF32[3584]
-
blk.14.attn_norm.weightF32[3584]
-
blk.14.ffn_down.weightQ4_0[14336 3584]
-
blk.14.ffn_gate.weightQ4_0[3584 14336]
-
blk.14.ffn_up.weightQ4_0[3584 14336]
-
blk.14.post_attention_norm.weightF32[3584]
-
blk.14.attn_output.weightQ4_0[4096 3584]
-
blk.14.ffn_norm.weightF32[3584]
-
blk.14.attn_k.weightQ4_0[3584 2048]
-
blk.14.attn_v.weightQ4_0[3584 2048]
-
blk.14.attn_q.weightQ4_0[3584 4096]
-
blk.15.attn_v.weightQ4_0[3584 2048]
-
blk.15.attn_q.weightQ4_0[3584 4096]
-
blk.15.attn_norm.weightF32[3584]
-
blk.15.ffn_down.weightQ4_0[14336 3584]
-
blk.15.ffn_gate.weightQ4_0[3584 14336]
-
blk.15.ffn_up.weightQ4_0[3584 14336]
-
blk.15.post_attention_norm.weightF32[3584]
-
blk.15.post_ffw_norm.weightF32[3584]
-
blk.15.ffn_norm.weightF32[3584]
-
blk.15.attn_k.weightQ4_0[3584 2048]
-
blk.15.attn_output.weightQ4_0[4096 3584]
-
blk.16.ffn_norm.weightF32[3584]
-
blk.16.attn_norm.weightF32[3584]
-
blk.16.attn_k.weightQ4_0[3584 2048]
-
blk.16.post_ffw_norm.weightF32[3584]
-
blk.16.attn_q.weightQ4_0[3584 4096]
-
blk.16.attn_v.weightQ4_0[3584 2048]
-
blk.16.attn_output.weightQ4_0[4096 3584]
-
blk.16.post_attention_norm.weightF32[3584]
-
blk.16.ffn_up.weightQ4_0[3584 14336]
-
blk.16.ffn_gate.weightQ4_0[3584 14336]
-
blk.16.ffn_down.weightQ4_0[14336 3584]
-
blk.17.attn_norm.weightF32[3584]
-
blk.17.ffn_norm.weightF32[3584]
-
blk.17.attn_k.weightQ4_0[3584 2048]
-
blk.17.attn_output.weightQ4_0[4096 3584]
-
blk.17.post_ffw_norm.weightF32[3584]
-
blk.17.post_attention_norm.weightF32[3584]
-
blk.17.ffn_up.weightQ4_0[3584 14336]
-
blk.17.ffn_gate.weightQ4_0[3584 14336]
-
blk.17.ffn_down.weightQ4_0[14336 3584]
-
blk.17.attn_v.weightQ4_0[3584 2048]
-
blk.17.attn_q.weightQ4_0[3584 4096]
-
blk.18.attn_v.weightQ4_0[3584 2048]
-
blk.18.post_ffw_norm.weightF32[3584]
-
blk.18.attn_norm.weightF32[3584]
-
blk.18.ffn_down.weightQ4_0[14336 3584]
-
blk.18.ffn_gate.weightQ4_0[3584 14336]
-
blk.18.ffn_up.weightQ4_0[3584 14336]
-
blk.18.post_attention_norm.weightF32[3584]
-
blk.18.attn_q.weightQ4_0[3584 4096]
-
blk.18.attn_output.weightQ4_0[4096 3584]
-
blk.18.attn_k.weightQ4_0[3584 2048]
-
blk.18.ffn_norm.weightF32[3584]
-
blk.19.ffn_norm.weightF32[3584]
-
blk.19.attn_norm.weightF32[3584]
-
blk.19.ffn_down.weightQ4_0[14336 3584]
-
blk.19.ffn_gate.weightQ4_0[3584 14336]
-
blk.19.ffn_up.weightQ4_0[3584 14336]
-
blk.19.post_attention_norm.weightF32[3584]
-
blk.19.post_ffw_norm.weightF32[3584]
-
blk.19.attn_k.weightQ4_0[3584 2048]
-
blk.19.attn_output.weightQ4_0[4096 3584]
-
blk.19.attn_q.weightQ4_0[3584 4096]
-
blk.19.attn_v.weightQ4_0[3584 2048]
-
blk.20.attn_k.weightQ4_0[3584 2048]
-
blk.20.attn_output.weightQ4_0[4096 3584]
-
blk.20.attn_q.weightQ4_0[3584 4096]
-
blk.20.attn_v.weightQ4_0[3584 2048]
-
blk.20.attn_norm.weightF32[3584]
-
blk.20.ffn_down.weightQ4_0[14336 3584]
-
blk.20.ffn_gate.weightQ4_0[3584 14336]
-
blk.20.ffn_up.weightQ4_0[3584 14336]
-
blk.20.post_attention_norm.weightF32[3584]
-
blk.20.post_ffw_norm.weightF32[3584]
-
blk.20.ffn_norm.weightF32[3584]
-
blk.21.ffn_down.weightQ4_0[14336 3584]
-
blk.21.attn_norm.weightF32[3584]
-
blk.21.ffn_gate.weightQ4_0[3584 14336]
-
blk.21.ffn_up.weightQ4_0[3584 14336]
-
blk.21.post_attention_norm.weightF32[3584]
-
blk.21.post_ffw_norm.weightF32[3584]
-
blk.21.ffn_norm.weightF32[3584]
-
blk.21.attn_k.weightQ4_0[3584 2048]
-
blk.21.attn_output.weightQ4_0[4096 3584]
-
blk.21.attn_q.weightQ4_0[3584 4096]
-
blk.21.attn_v.weightQ4_0[3584 2048]
-
blk.22.attn_norm.weightF32[3584]
-
blk.22.ffn_down.weightQ4_0[14336 3584]
-
blk.22.ffn_gate.weightQ4_0[3584 14336]
-
blk.22.ffn_up.weightQ4_0[3584 14336]
-
blk.22.post_attention_norm.weightF32[3584]
-
blk.22.post_ffw_norm.weightF32[3584]
-
blk.22.ffn_norm.weightF32[3584]
-
blk.22.attn_k.weightQ4_0[3584 2048]
-
blk.22.attn_output.weightQ4_0[4096 3584]
-
blk.22.attn_q.weightQ4_0[3584 4096]
-
blk.22.attn_v.weightQ4_0[3584 2048]
-
blk.23.attn_norm.weightF32[3584]
-
blk.23.ffn_down.weightQ4_0[14336 3584]
-
blk.23.ffn_gate.weightQ4_0[3584 14336]
-
blk.23.ffn_up.weightQ4_0[3584 14336]
-
blk.23.post_attention_norm.weightF32[3584]
-
blk.23.post_ffw_norm.weightF32[3584]
-
blk.23.ffn_norm.weightF32[3584]
-
blk.23.attn_k.weightQ4_0[3584 2048]
-
blk.23.attn_output.weightQ4_0[4096 3584]
-
blk.23.attn_q.weightQ4_0[3584 4096]
-
blk.23.attn_v.weightQ4_0[3584 2048]
-
blk.24.attn_norm.weightF32[3584]
-
blk.24.ffn_down.weightQ4_0[14336 3584]
-
blk.24.ffn_gate.weightQ4_0[3584 14336]
-
blk.24.ffn_up.weightQ4_0[3584 14336]
-
blk.24.post_attention_norm.weightF32[3584]
-
blk.24.post_ffw_norm.weightF32[3584]
-
blk.24.ffn_norm.weightF32[3584]
-
blk.24.attn_k.weightQ4_0[3584 2048]
-
blk.24.attn_output.weightQ4_0[4096 3584]
-
blk.24.attn_q.weightQ4_0[3584 4096]
-
blk.24.attn_v.weightQ4_0[3584 2048]
-
blk.25.attn_norm.weightF32[3584]
-
blk.25.ffn_down.weightQ4_0[14336 3584]
-
blk.25.ffn_gate.weightQ4_0[3584 14336]
-
blk.25.ffn_up.weightQ4_0[3584 14336]
-
blk.25.post_attention_norm.weightF32[3584]
-
blk.25.post_ffw_norm.weightF32[3584]
-
blk.25.ffn_norm.weightF32[3584]
-
blk.25.attn_k.weightQ4_0[3584 2048]
-
blk.25.attn_output.weightQ4_0[4096 3584]
-
blk.25.attn_q.weightQ4_0[3584 4096]
-
blk.25.attn_v.weightQ4_0[3584 2048]
-
blk.26.attn_norm.weightF32[3584]
-
blk.26.ffn_down.weightQ4_0[14336 3584]
-
blk.26.ffn_gate.weightQ4_0[3584 14336]
-
blk.26.ffn_up.weightQ4_0[3584 14336]
-
blk.26.post_attention_norm.weightF32[3584]
-
blk.26.post_ffw_norm.weightF32[3584]
-
blk.26.ffn_norm.weightF32[3584]
-
blk.26.attn_k.weightQ4_0[3584 2048]
-
blk.26.attn_output.weightQ4_0[4096 3584]
-
blk.26.attn_q.weightQ4_0[3584 4096]
-
blk.26.attn_v.weightQ4_0[3584 2048]
-
blk.27.attn_norm.weightF32[3584]
-
blk.27.ffn_down.weightQ4_0[14336 3584]
-
blk.27.ffn_gate.weightQ4_0[3584 14336]
-
blk.27.ffn_up.weightQ4_0[3584 14336]
-
blk.27.post_attention_norm.weightF32[3584]
-
blk.27.post_ffw_norm.weightF32[3584]
-
blk.27.ffn_norm.weightF32[3584]
-
blk.27.attn_k.weightQ4_0[3584 2048]
-
blk.27.attn_output.weightQ4_0[4096 3584]
-
blk.27.attn_q.weightQ4_0[3584 4096]
-
blk.27.attn_v.weightQ4_0[3584 2048]
-
blk.28.attn_norm.weightF32[3584]
-
blk.28.ffn_down.weightQ4_0[14336 3584]
-
blk.28.ffn_gate.weightQ4_0[3584 14336]
-
blk.28.ffn_up.weightQ4_0[3584 14336]
-
blk.28.post_attention_norm.weightF32[3584]
-
blk.28.post_ffw_norm.weightF32[3584]
-
blk.28.ffn_norm.weightF32[3584]
-
blk.28.attn_k.weightQ4_0[3584 2048]
-
blk.28.attn_output.weightQ4_0[4096 3584]
-
blk.28.attn_q.weightQ4_0[3584 4096]
-
blk.28.attn_v.weightQ4_0[3584 2048]
-
blk.29.attn_norm.weightF32[3584]
-
blk.29.ffn_down.weightQ4_0[14336 3584]
-
blk.29.ffn_gate.weightQ4_0[3584 14336]
-
blk.29.ffn_up.weightQ4_0[3584 14336]
-
blk.29.post_attention_norm.weightF32[3584]
-
blk.29.post_ffw_norm.weightF32[3584]
-
blk.29.ffn_norm.weightF32[3584]
-
blk.29.attn_k.weightQ4_0[3584 2048]
-
blk.29.attn_output.weightQ4_0[4096 3584]
-
blk.29.attn_q.weightQ4_0[3584 4096]
-
blk.29.attn_v.weightQ4_0[3584 2048]
-
blk.30.attn_norm.weightF32[3584]
-
blk.30.ffn_down.weightQ4_0[14336 3584]
-
blk.30.ffn_gate.weightQ4_0[3584 14336]
-
blk.30.ffn_up.weightQ4_0[3584 14336]
-
blk.30.post_attention_norm.weightF32[3584]
-
blk.30.post_ffw_norm.weightF32[3584]
-
blk.30.ffn_norm.weightF32[3584]
-
blk.30.attn_k.weightQ4_0[3584 2048]
-
blk.30.attn_output.weightQ4_0[4096 3584]
-
blk.30.attn_q.weightQ4_0[3584 4096]
-
blk.30.attn_v.weightQ4_0[3584 2048]
-
blk.31.attn_k.weightQ4_0[3584 2048]
-
blk.31.ffn_down.weightQ4_0[14336 3584]
-
blk.31.ffn_gate.weightQ4_0[3584 14336]
-
blk.31.ffn_up.weightQ4_0[3584 14336]
-
blk.31.post_attention_norm.weightF32[3584]
-
blk.31.post_ffw_norm.weightF32[3584]
-
blk.31.ffn_norm.weightF32[3584]
-
blk.31.attn_norm.weightF32[3584]
-
blk.31.attn_output.weightQ4_0[4096 3584]
-
blk.31.attn_q.weightQ4_0[3584 4096]
-
blk.31.attn_v.weightQ4_0[3584 2048]
-
blk.32.ffn_gate.weightQ4_0[3584 14336]
-
blk.32.ffn_up.weightQ4_0[3584 14336]
-
blk.32.attn_k.weightQ4_0[3584 2048]
-
blk.32.attn_output.weightQ4_0[4096 3584]
-
blk.32.attn_q.weightQ4_0[3584 4096]
-
blk.32.attn_v.weightQ4_0[3584 2048]
-
blk.32.attn_norm.weightF32[3584]
-
blk.32.ffn_down.weightQ4_0[14336 3584]
-
blk.32.post_attention_norm.weightF32[3584]
-
blk.32.post_ffw_norm.weightF32[3584]
-
blk.32.ffn_norm.weightF32[3584]
-
blk.33.attn_norm.weightF32[3584]
-
blk.33.ffn_down.weightQ4_0[14336 3584]
-
blk.33.ffn_gate.weightQ4_0[3584 14336]
-
blk.33.ffn_up.weightQ4_0[3584 14336]
-
blk.33.post_attention_norm.weightF32[3584]
-
blk.33.post_ffw_norm.weightF32[3584]
-
blk.33.ffn_norm.weightF32[3584]
-
blk.33.attn_k.weightQ4_0[3584 2048]
-
blk.33.attn_output.weightQ4_0[4096 3584]
-
blk.33.attn_q.weightQ4_0[3584 4096]
-
blk.33.attn_v.weightQ4_0[3584 2048]
-
blk.34.attn_norm.weightF32[3584]
-
blk.34.ffn_down.weightQ4_0[14336 3584]
-
blk.34.ffn_gate.weightQ4_0[3584 14336]
-
blk.34.ffn_up.weightQ4_0[3584 14336]
-
blk.34.post_attention_norm.weightF32[3584]
-
blk.34.post_ffw_norm.weightF32[3584]
-
blk.34.ffn_norm.weightF32[3584]
-
blk.34.attn_k.weightQ4_0[3584 2048]
-
blk.34.attn_output.weightQ4_0[4096 3584]
-
blk.34.attn_q.weightQ4_0[3584 4096]
-
blk.34.attn_v.weightQ4_0[3584 2048]
-
blk.35.attn_norm.weightF32[3584]
-
blk.35.ffn_down.weightQ4_0[14336 3584]
-
blk.35.ffn_gate.weightQ4_0[3584 14336]
-
blk.35.ffn_up.weightQ4_0[3584 14336]
-
blk.35.post_attention_norm.weightF32[3584]
-
blk.35.post_ffw_norm.weightF32[3584]
-
blk.35.ffn_norm.weightF32[3584]
-
blk.35.attn_k.weightQ4_0[3584 2048]
-
blk.35.attn_output.weightQ4_0[4096 3584]
-
blk.35.attn_q.weightQ4_0[3584 4096]
-
blk.35.attn_v.weightQ4_0[3584 2048]
-
blk.36.ffn_norm.weightF32[3584]
-
blk.36.ffn_down.weightQ4_0[14336 3584]
-
blk.36.ffn_gate.weightQ4_0[3584 14336]
-
blk.36.ffn_up.weightQ4_0[3584 14336]
-
blk.36.post_attention_norm.weightF32[3584]
-
blk.36.post_ffw_norm.weightF32[3584]
-
blk.36.attn_norm.weightF32[3584]
-
blk.36.attn_k.weightQ4_0[3584 2048]
-
blk.36.attn_output.weightQ4_0[4096 3584]
-
blk.36.attn_q.weightQ4_0[3584 4096]
-
blk.36.attn_v.weightQ4_0[3584 2048]
-
blk.37.attn_norm.weightF32[3584]
-
blk.37.ffn_down.weightQ4_0[14336 3584]
-
blk.37.ffn_gate.weightQ4_0[3584 14336]
-
blk.37.ffn_up.weightQ4_0[3584 14336]
-
blk.37.post_attention_norm.weightF32[3584]
-
blk.37.post_ffw_norm.weightF32[3584]
-
blk.37.ffn_norm.weightF32[3584]
-
blk.37.attn_k.weightQ4_0[3584 2048]
-
blk.37.attn_output.weightQ4_0[4096 3584]
-
blk.37.attn_q.weightQ4_0[3584 4096]
-
blk.37.attn_v.weightQ4_0[3584 2048]
-
blk.38.attn_norm.weightF32[3584]
-
blk.38.ffn_down.weightQ4_0[14336 3584]
-
blk.38.ffn_gate.weightQ4_0[3584 14336]
-
blk.38.ffn_up.weightQ4_0[3584 14336]
-
blk.38.post_attention_norm.weightF32[3584]
-
blk.38.post_ffw_norm.weightF32[3584]
-
blk.38.ffn_norm.weightF32[3584]
-
blk.38.attn_k.weightQ4_0[3584 2048]
-
blk.38.attn_output.weightQ4_0[4096 3584]
-
blk.38.attn_q.weightQ4_0[3584 4096]
-
blk.38.attn_v.weightQ4_0[3584 2048]
-
blk.39.attn_norm.weightF32[3584]
-
blk.39.ffn_down.weightQ4_0[14336 3584]
-
blk.39.ffn_gate.weightQ4_0[3584 14336]
-
blk.39.ffn_up.weightQ4_0[3584 14336]
-
blk.39.post_attention_norm.weightF32[3584]
-
blk.39.post_ffw_norm.weightF32[3584]
-
blk.39.ffn_norm.weightF32[3584]
-
blk.39.attn_k.weightQ4_0[3584 2048]
-
blk.39.attn_output.weightQ4_0[4096 3584]
-
blk.39.attn_q.weightQ4_0[3584 4096]
-
blk.39.attn_v.weightQ4_0[3584 2048]
-
blk.40.attn_norm.weightF32[3584]
-
blk.40.ffn_down.weightQ4_0[14336 3584]
-
blk.40.ffn_gate.weightQ4_0[3584 14336]
-
blk.40.ffn_up.weightQ4_0[3584 14336]
-
blk.40.post_attention_norm.weightF32[3584]
-
blk.40.post_ffw_norm.weightF32[3584]
-
blk.40.ffn_norm.weightF32[3584]
-
blk.40.attn_k.weightQ4_0[3584 2048]
-
blk.40.attn_output.weightQ4_0[4096 3584]
-
blk.40.attn_q.weightQ4_0[3584 4096]
-
blk.40.attn_v.weightQ4_0[3584 2048]
-
blk.41.attn_norm.weightF32[3584]
-
blk.41.ffn_down.weightQ4_0[14336 3584]
-
blk.41.ffn_gate.weightQ4_0[3584 14336]
-
blk.41.ffn_up.weightQ4_0[3584 14336]
-
blk.41.post_attention_norm.weightF32[3584]
-
blk.41.post_ffw_norm.weightF32[3584]
-
blk.41.ffn_norm.weightF32[3584]
-
blk.41.attn_k.weightQ4_0[3584 2048]
-
blk.41.attn_output.weightQ4_0[4096 3584]
-
blk.41.attn_q.weightQ4_0[3584 4096]
-
blk.41.attn_v.weightQ4_0[3584 2048]
-
output_norm.weightF32[3584]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41