latest
5.8GB
Quantized version of IlyaGusev/saiga_gemma2_9b created by QuantFactory
9B
11 Pulls Updated 10 days ago
07dca63c396e · 5.8GB
-
general.architecturegemma2
-
general.file_typeQ4_K_M
-
gemma2.attention.head_count16
-
gemma2.attention.head_count_kv8
-
gemma2.attention.key_length256
-
gemma2.attention.layer_norm_rms_epsilon1e-06
-
gemma2.attention.sliding_window4096
-
gemma2.attention.value_length256
-
gemma2.attn_logit_softcapping50
-
gemma2.block_count42
-
gemma2.context_length8192
-
gemma2.embedding_length3584
-
gemma2.feed_forward_length14336
-
gemma2.final_logit_softcapping30
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id2
-
tokenizer.ggml.eos_token_id1
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<pad> <eos> <bos> <unk> <mask> ...]
-
tokenizer.ggml.unknown_token_id3
-
NameTypeShape
-
token_embd.weightQ6_K[3584 256000]
-
blk.0.attn_norm.weightF32[3584]
-
blk.0.ffn_down.weightQ6_K[14336 3584]
-
blk.0.ffn_gate.weightQ4_K[3584 14336]
-
blk.0.ffn_up.weightQ4_K[3584 14336]
-
blk.0.post_attention_norm.weightF32[3584]
-
blk.0.post_ffw_norm.weightF32[3584]
-
blk.0.ffn_norm.weightF32[3584]
-
blk.0.attn_k.weightQ4_K[3584 2048]
-
blk.0.attn_output.weightQ4_K[4096 3584]
-
blk.0.attn_q.weightQ4_K[3584 4096]
-
blk.0.attn_v.weightQ6_K[3584 2048]
-
blk.1.attn_norm.weightF32[3584]
-
blk.1.ffn_down.weightQ6_K[14336 3584]
-
blk.1.ffn_gate.weightQ4_K[3584 14336]
-
blk.1.ffn_up.weightQ4_K[3584 14336]
-
blk.1.post_attention_norm.weightF32[3584]
-
blk.1.post_ffw_norm.weightF32[3584]
-
blk.1.ffn_norm.weightF32[3584]
-
blk.1.attn_k.weightQ4_K[3584 2048]
-
blk.1.attn_output.weightQ4_K[4096 3584]
-
blk.1.attn_q.weightQ4_K[3584 4096]
-
blk.1.attn_v.weightQ6_K[3584 2048]
-
blk.2.attn_norm.weightF32[3584]
-
blk.2.ffn_down.weightQ6_K[14336 3584]
-
blk.2.ffn_gate.weightQ4_K[3584 14336]
-
blk.2.ffn_up.weightQ4_K[3584 14336]
-
blk.2.post_attention_norm.weightF32[3584]
-
blk.2.post_ffw_norm.weightF32[3584]
-
blk.2.ffn_norm.weightF32[3584]
-
blk.2.attn_k.weightQ4_K[3584 2048]
-
blk.2.attn_output.weightQ4_K[4096 3584]
-
blk.2.attn_q.weightQ4_K[3584 4096]
-
blk.2.attn_v.weightQ6_K[3584 2048]
-
blk.3.attn_norm.weightF32[3584]
-
blk.3.ffn_down.weightQ6_K[14336 3584]
-
blk.3.ffn_gate.weightQ4_K[3584 14336]
-
blk.3.ffn_up.weightQ4_K[3584 14336]
-
blk.3.post_attention_norm.weightF32[3584]
-
blk.3.post_ffw_norm.weightF32[3584]
-
blk.3.ffn_norm.weightF32[3584]
-
blk.3.attn_k.weightQ4_K[3584 2048]
-
blk.3.attn_output.weightQ4_K[4096 3584]
-
blk.3.attn_q.weightQ4_K[3584 4096]
-
blk.3.attn_v.weightQ6_K[3584 2048]
-
blk.4.attn_norm.weightF32[3584]
-
blk.4.ffn_down.weightQ6_K[14336 3584]
-
blk.4.ffn_gate.weightQ4_K[3584 14336]
-
blk.4.ffn_up.weightQ4_K[3584 14336]
-
blk.4.post_attention_norm.weightF32[3584]
-
blk.4.post_ffw_norm.weightF32[3584]
-
blk.4.ffn_norm.weightF32[3584]
-
blk.4.attn_k.weightQ4_K[3584 2048]
-
blk.4.attn_output.weightQ4_K[4096 3584]
-
blk.4.attn_q.weightQ4_K[3584 4096]
-
blk.4.attn_v.weightQ6_K[3584 2048]
-
blk.5.attn_norm.weightF32[3584]
-
blk.5.ffn_down.weightQ4_K[14336 3584]
-
blk.5.ffn_gate.weightQ4_K[3584 14336]
-
blk.5.ffn_up.weightQ4_K[3584 14336]
-
blk.5.post_attention_norm.weightF32[3584]
-
blk.5.post_ffw_norm.weightF32[3584]
-
blk.5.ffn_norm.weightF32[3584]
-
blk.5.attn_k.weightQ4_K[3584 2048]
-
blk.5.attn_output.weightQ4_K[4096 3584]
-
blk.5.attn_q.weightQ4_K[3584 4096]
-
blk.5.attn_v.weightQ4_K[3584 2048]
-
blk.6.attn_norm.weightF32[3584]
-
blk.6.ffn_down.weightQ4_K[14336 3584]
-
blk.6.ffn_gate.weightQ4_K[3584 14336]
-
blk.6.ffn_up.weightQ4_K[3584 14336]
-
blk.6.post_attention_norm.weightF32[3584]
-
blk.6.post_ffw_norm.weightF32[3584]
-
blk.6.ffn_norm.weightF32[3584]
-
blk.6.attn_k.weightQ4_K[3584 2048]
-
blk.6.attn_output.weightQ4_K[4096 3584]
-
blk.6.attn_q.weightQ4_K[3584 4096]
-
blk.6.attn_v.weightQ4_K[3584 2048]
-
blk.7.ffn_gate.weightQ4_K[3584 14336]
-
blk.7.ffn_up.weightQ4_K[3584 14336]
-
blk.7.attn_k.weightQ4_K[3584 2048]
-
blk.7.attn_output.weightQ4_K[4096 3584]
-
blk.7.attn_q.weightQ4_K[3584 4096]
-
blk.7.attn_v.weightQ6_K[3584 2048]
-
blk.7.attn_norm.weightF32[3584]
-
blk.7.ffn_down.weightQ4_K[14336 3584]
-
blk.7.post_attention_norm.weightF32[3584]
-
blk.7.post_ffw_norm.weightF32[3584]
-
blk.7.ffn_norm.weightF32[3584]
-
blk.8.attn_norm.weightF32[3584]
-
blk.8.ffn_down.weightQ4_K[14336 3584]
-
blk.8.ffn_gate.weightQ4_K[3584 14336]
-
blk.8.ffn_up.weightQ4_K[3584 14336]
-
blk.8.post_attention_norm.weightF32[3584]
-
blk.8.post_ffw_norm.weightF32[3584]
-
blk.8.ffn_norm.weightF32[3584]
-
blk.8.attn_k.weightQ4_K[3584 2048]
-
blk.8.attn_output.weightQ4_K[4096 3584]
-
blk.8.attn_q.weightQ4_K[3584 4096]
-
blk.8.attn_v.weightQ6_K[3584 2048]
-
blk.9.attn_norm.weightF32[3584]
-
blk.9.ffn_down.weightQ6_K[14336 3584]
-
blk.9.ffn_gate.weightQ4_K[3584 14336]
-
blk.9.ffn_up.weightQ4_K[3584 14336]
-
blk.9.post_attention_norm.weightF32[3584]
-
blk.9.post_ffw_norm.weightF32[3584]
-
blk.9.ffn_norm.weightF32[3584]
-
blk.9.attn_k.weightQ4_K[3584 2048]
-
blk.9.attn_output.weightQ4_K[4096 3584]
-
blk.9.attn_q.weightQ4_K[3584 4096]
-
blk.9.attn_v.weightQ4_K[3584 2048]
-
blk.10.attn_norm.weightF32[3584]
-
blk.10.ffn_down.weightQ6_K[14336 3584]
-
blk.10.ffn_gate.weightQ4_K[3584 14336]
-
blk.10.ffn_up.weightQ4_K[3584 14336]
-
blk.10.post_attention_norm.weightF32[3584]
-
blk.10.post_ffw_norm.weightF32[3584]
-
blk.10.ffn_norm.weightF32[3584]
-
blk.10.attn_k.weightQ4_K[3584 2048]
-
blk.10.attn_output.weightQ4_K[4096 3584]
-
blk.10.attn_q.weightQ4_K[3584 4096]
-
blk.10.attn_v.weightQ4_K[3584 2048]
-
blk.11.attn_norm.weightF32[3584]
-
blk.11.ffn_down.weightQ4_K[14336 3584]
-
blk.11.ffn_gate.weightQ4_K[3584 14336]
-
blk.11.ffn_up.weightQ4_K[3584 14336]
-
blk.11.post_attention_norm.weightF32[3584]
-
blk.11.post_ffw_norm.weightF32[3584]
-
blk.11.ffn_norm.weightF32[3584]
-
blk.11.attn_k.weightQ4_K[3584 2048]
-
blk.11.attn_output.weightQ4_K[4096 3584]
-
blk.11.attn_q.weightQ4_K[3584 4096]
-
blk.11.attn_v.weightQ4_K[3584 2048]
-
blk.12.attn_norm.weightF32[3584]
-
blk.12.ffn_down.weightQ4_K[14336 3584]
-
blk.12.ffn_gate.weightQ4_K[3584 14336]
-
blk.12.ffn_up.weightQ4_K[3584 14336]
-
blk.12.post_attention_norm.weightF32[3584]
-
blk.12.post_ffw_norm.weightF32[3584]
-
blk.12.ffn_norm.weightF32[3584]
-
blk.12.attn_k.weightQ4_K[3584 2048]
-
blk.12.attn_output.weightQ4_K[4096 3584]
-
blk.12.attn_q.weightQ4_K[3584 4096]
-
blk.12.attn_v.weightQ6_K[3584 2048]
-
blk.13.attn_norm.weightF32[3584]
-
blk.13.ffn_down.weightQ6_K[14336 3584]
-
blk.13.ffn_gate.weightQ4_K[3584 14336]
-
blk.13.ffn_up.weightQ4_K[3584 14336]
-
blk.13.post_attention_norm.weightF32[3584]
-
blk.13.post_ffw_norm.weightF32[3584]
-
blk.13.ffn_norm.weightF32[3584]
-
blk.13.attn_k.weightQ4_K[3584 2048]
-
blk.13.attn_output.weightQ4_K[4096 3584]
-
blk.13.attn_q.weightQ4_K[3584 4096]
-
blk.13.attn_v.weightQ4_K[3584 2048]
-
blk.14.attn_norm.weightF32[3584]
-
blk.14.ffn_down.weightQ4_K[14336 3584]
-
blk.14.ffn_gate.weightQ4_K[3584 14336]
-
blk.14.ffn_up.weightQ4_K[3584 14336]
-
blk.14.post_attention_norm.weightF32[3584]
-
blk.14.post_ffw_norm.weightF32[3584]
-
blk.14.ffn_norm.weightF32[3584]
-
blk.14.attn_k.weightQ4_K[3584 2048]
-
blk.14.attn_output.weightQ4_K[4096 3584]
-
blk.14.attn_q.weightQ4_K[3584 4096]
-
blk.14.attn_v.weightQ4_K[3584 2048]
-
blk.15.attn_norm.weightF32[3584]
-
blk.15.ffn_down.weightQ4_K[14336 3584]
-
blk.15.ffn_gate.weightQ4_K[3584 14336]
-
blk.15.ffn_up.weightQ4_K[3584 14336]
-
blk.15.post_attention_norm.weightF32[3584]
-
blk.15.post_ffw_norm.weightF32[3584]
-
blk.15.ffn_norm.weightF32[3584]
-
blk.15.attn_k.weightQ4_K[3584 2048]
-
blk.15.attn_output.weightQ4_K[4096 3584]
-
blk.15.attn_q.weightQ4_K[3584 4096]
-
blk.15.attn_v.weightQ6_K[3584 2048]
-
blk.16.attn_norm.weightF32[3584]
-
blk.16.ffn_down.weightQ6_K[14336 3584]
-
blk.16.ffn_gate.weightQ4_K[3584 14336]
-
blk.16.ffn_up.weightQ4_K[3584 14336]
-
blk.16.post_attention_norm.weightF32[3584]
-
blk.16.post_ffw_norm.weightF32[3584]
-
blk.16.ffn_norm.weightF32[3584]
-
blk.16.attn_k.weightQ4_K[3584 2048]
-
blk.16.attn_output.weightQ4_K[4096 3584]
-
blk.16.attn_q.weightQ4_K[3584 4096]
-
blk.16.attn_v.weightQ4_K[3584 2048]
-
blk.17.attn_norm.weightF32[3584]
-
blk.17.ffn_down.weightQ4_K[14336 3584]
-
blk.17.ffn_gate.weightQ4_K[3584 14336]
-
blk.17.ffn_up.weightQ4_K[3584 14336]
-
blk.17.post_attention_norm.weightF32[3584]
-
blk.17.post_ffw_norm.weightF32[3584]
-
blk.17.ffn_norm.weightF32[3584]
-
blk.17.attn_k.weightQ4_K[3584 2048]
-
blk.17.attn_output.weightQ4_K[4096 3584]
-
blk.17.attn_q.weightQ4_K[3584 4096]
-
blk.17.attn_v.weightQ4_K[3584 2048]
-
blk.18.attn_norm.weightF32[3584]
-
blk.18.ffn_down.weightQ4_K[14336 3584]
-
blk.18.ffn_gate.weightQ4_K[3584 14336]
-
blk.18.ffn_up.weightQ4_K[3584 14336]
-
blk.18.post_attention_norm.weightF32[3584]
-
blk.18.post_ffw_norm.weightF32[3584]
-
blk.18.ffn_norm.weightF32[3584]
-
blk.18.attn_k.weightQ4_K[3584 2048]
-
blk.18.attn_output.weightQ4_K[4096 3584]
-
blk.18.attn_q.weightQ4_K[3584 4096]
-
blk.18.attn_v.weightQ6_K[3584 2048]
-
blk.19.attn_norm.weightF32[3584]
-
blk.19.ffn_down.weightQ6_K[14336 3584]
-
blk.19.ffn_gate.weightQ4_K[3584 14336]
-
blk.19.ffn_up.weightQ4_K[3584 14336]
-
blk.19.post_attention_norm.weightF32[3584]
-
blk.19.post_ffw_norm.weightF32[3584]
-
blk.19.ffn_norm.weightF32[3584]
-
blk.19.attn_k.weightQ4_K[3584 2048]
-
blk.19.attn_output.weightQ4_K[4096 3584]
-
blk.19.attn_q.weightQ4_K[3584 4096]
-
blk.19.attn_v.weightQ4_K[3584 2048]
-
blk.20.attn_k.weightQ4_K[3584 2048]
-
blk.20.attn_output.weightQ4_K[4096 3584]
-
blk.20.attn_q.weightQ4_K[3584 4096]
-
blk.20.attn_v.weightQ4_K[3584 2048]
-
blk.20.attn_norm.weightF32[3584]
-
blk.20.ffn_down.weightQ4_K[14336 3584]
-
blk.20.ffn_gate.weightQ4_K[3584 14336]
-
blk.20.ffn_up.weightQ4_K[3584 14336]
-
blk.20.post_attention_norm.weightF32[3584]
-
blk.20.post_ffw_norm.weightF32[3584]
-
blk.20.ffn_norm.weightF32[3584]
-
blk.21.attn_norm.weightF32[3584]
-
blk.21.ffn_down.weightQ4_K[14336 3584]
-
blk.21.ffn_gate.weightQ4_K[3584 14336]
-
blk.21.ffn_up.weightQ4_K[3584 14336]
-
blk.21.post_attention_norm.weightF32[3584]
-
blk.21.post_ffw_norm.weightF32[3584]
-
blk.21.ffn_norm.weightF32[3584]
-
blk.21.attn_k.weightQ4_K[3584 2048]
-
blk.21.attn_output.weightQ4_K[4096 3584]
-
blk.21.attn_q.weightQ4_K[3584 4096]
-
blk.21.attn_v.weightQ4_K[3584 2048]
-
blk.22.attn_norm.weightF32[3584]
-
blk.22.ffn_down.weightQ6_K[14336 3584]
-
blk.22.ffn_gate.weightQ4_K[3584 14336]
-
blk.22.ffn_up.weightQ4_K[3584 14336]
-
blk.22.post_attention_norm.weightF32[3584]
-
blk.22.post_ffw_norm.weightF32[3584]
-
blk.22.ffn_norm.weightF32[3584]
-
blk.22.attn_k.weightQ4_K[3584 2048]
-
blk.22.attn_output.weightQ4_K[4096 3584]
-
blk.22.attn_q.weightQ4_K[3584 4096]
-
blk.22.attn_v.weightQ6_K[3584 2048]
-
blk.23.attn_norm.weightF32[3584]
-
blk.23.ffn_down.weightQ4_K[14336 3584]
-
blk.23.ffn_gate.weightQ4_K[3584 14336]
-
blk.23.ffn_up.weightQ4_K[3584 14336]
-
blk.23.post_attention_norm.weightF32[3584]
-
blk.23.post_ffw_norm.weightF32[3584]
-
blk.23.ffn_norm.weightF32[3584]
-
blk.23.attn_k.weightQ4_K[3584 2048]
-
blk.23.attn_output.weightQ4_K[4096 3584]
-
blk.23.attn_q.weightQ4_K[3584 4096]
-
blk.23.attn_v.weightQ4_K[3584 2048]
-
blk.24.attn_norm.weightF32[3584]
-
blk.24.ffn_down.weightQ4_K[14336 3584]
-
blk.24.ffn_gate.weightQ4_K[3584 14336]
-
blk.24.ffn_up.weightQ4_K[3584 14336]
-
blk.24.post_attention_norm.weightF32[3584]
-
blk.24.post_ffw_norm.weightF32[3584]
-
blk.24.ffn_norm.weightF32[3584]
-
blk.24.attn_k.weightQ4_K[3584 2048]
-
blk.24.attn_output.weightQ4_K[4096 3584]
-
blk.24.attn_q.weightQ4_K[3584 4096]
-
blk.24.attn_v.weightQ4_K[3584 2048]
-
blk.25.attn_norm.weightF32[3584]
-
blk.25.ffn_down.weightQ6_K[14336 3584]
-
blk.25.ffn_gate.weightQ4_K[3584 14336]
-
blk.25.ffn_up.weightQ4_K[3584 14336]
-
blk.25.post_attention_norm.weightF32[3584]
-
blk.25.post_ffw_norm.weightF32[3584]
-
blk.25.ffn_norm.weightF32[3584]
-
blk.25.attn_k.weightQ4_K[3584 2048]
-
blk.25.attn_output.weightQ4_K[4096 3584]
-
blk.25.attn_q.weightQ4_K[3584 4096]
-
blk.25.attn_v.weightQ6_K[3584 2048]
-
blk.26.attn_norm.weightF32[3584]
-
blk.26.ffn_down.weightQ4_K[14336 3584]
-
blk.26.ffn_gate.weightQ4_K[3584 14336]
-
blk.26.ffn_up.weightQ4_K[3584 14336]
-
blk.26.post_attention_norm.weightF32[3584]
-
blk.26.post_ffw_norm.weightF32[3584]
-
blk.26.ffn_norm.weightF32[3584]
-
blk.26.attn_k.weightQ4_K[3584 2048]
-
blk.26.attn_output.weightQ4_K[4096 3584]
-
blk.26.attn_q.weightQ4_K[3584 4096]
-
blk.26.attn_v.weightQ4_K[3584 2048]
-
blk.27.attn_norm.weightF32[3584]
-
blk.27.ffn_down.weightQ4_K[14336 3584]
-
blk.27.ffn_gate.weightQ4_K[3584 14336]
-
blk.27.ffn_up.weightQ4_K[3584 14336]
-
blk.27.post_attention_norm.weightF32[3584]
-
blk.27.post_ffw_norm.weightF32[3584]
-
blk.27.ffn_norm.weightF32[3584]
-
blk.27.attn_k.weightQ4_K[3584 2048]
-
blk.27.attn_output.weightQ4_K[4096 3584]
-
blk.27.attn_q.weightQ4_K[3584 4096]
-
blk.27.attn_v.weightQ4_K[3584 2048]
-
blk.28.attn_norm.weightF32[3584]
-
blk.28.ffn_down.weightQ6_K[14336 3584]
-
blk.28.ffn_gate.weightQ4_K[3584 14336]
-
blk.28.ffn_up.weightQ4_K[3584 14336]
-
blk.28.post_attention_norm.weightF32[3584]
-
blk.28.post_ffw_norm.weightF32[3584]
-
blk.28.ffn_norm.weightF32[3584]
-
blk.28.attn_k.weightQ4_K[3584 2048]
-
blk.28.attn_output.weightQ4_K[4096 3584]
-
blk.28.attn_q.weightQ4_K[3584 4096]
-
blk.28.attn_v.weightQ6_K[3584 2048]
-
blk.29.attn_norm.weightF32[3584]
-
blk.29.ffn_down.weightQ4_K[14336 3584]
-
blk.29.ffn_gate.weightQ4_K[3584 14336]
-
blk.29.ffn_up.weightQ4_K[3584 14336]
-
blk.29.post_attention_norm.weightF32[3584]
-
blk.29.post_ffw_norm.weightF32[3584]
-
blk.29.ffn_norm.weightF32[3584]
-
blk.29.attn_k.weightQ4_K[3584 2048]
-
blk.29.attn_output.weightQ4_K[4096 3584]
-
blk.29.attn_q.weightQ4_K[3584 4096]
-
blk.29.attn_v.weightQ4_K[3584 2048]
-
blk.30.attn_norm.weightF32[3584]
-
blk.30.ffn_down.weightQ4_K[14336 3584]
-
blk.30.ffn_gate.weightQ4_K[3584 14336]
-
blk.30.ffn_up.weightQ4_K[3584 14336]
-
blk.30.post_attention_norm.weightF32[3584]
-
blk.30.post_ffw_norm.weightF32[3584]
-
blk.30.ffn_norm.weightF32[3584]
-
blk.30.attn_k.weightQ4_K[3584 2048]
-
blk.30.attn_output.weightQ4_K[4096 3584]
-
blk.30.attn_q.weightQ4_K[3584 4096]
-
blk.30.attn_v.weightQ4_K[3584 2048]
-
blk.31.attn_norm.weightF32[3584]
-
blk.31.ffn_down.weightQ6_K[14336 3584]
-
blk.31.ffn_gate.weightQ4_K[3584 14336]
-
blk.31.ffn_up.weightQ4_K[3584 14336]
-
blk.31.post_attention_norm.weightF32[3584]
-
blk.31.post_ffw_norm.weightF32[3584]
-
blk.31.ffn_norm.weightF32[3584]
-
blk.31.attn_k.weightQ4_K[3584 2048]
-
blk.31.attn_output.weightQ4_K[4096 3584]
-
blk.31.attn_q.weightQ4_K[3584 4096]
-
blk.31.attn_v.weightQ6_K[3584 2048]
-
blk.32.ffn_gate.weightQ4_K[3584 14336]
-
blk.32.ffn_up.weightQ4_K[3584 14336]
-
blk.32.attn_k.weightQ4_K[3584 2048]
-
blk.32.attn_output.weightQ4_K[4096 3584]
-
blk.32.attn_q.weightQ4_K[3584 4096]
-
blk.32.attn_v.weightQ4_K[3584 2048]
-
blk.32.attn_norm.weightF32[3584]
-
blk.32.ffn_down.weightQ4_K[14336 3584]
-
blk.32.post_attention_norm.weightF32[3584]
-
blk.32.post_ffw_norm.weightF32[3584]
-
blk.32.ffn_norm.weightF32[3584]
-
blk.33.attn_norm.weightF32[3584]
-
blk.33.ffn_down.weightQ4_K[14336 3584]
-
blk.33.ffn_gate.weightQ4_K[3584 14336]
-
blk.33.ffn_up.weightQ4_K[3584 14336]
-
blk.33.post_attention_norm.weightF32[3584]
-
blk.33.post_ffw_norm.weightF32[3584]
-
blk.33.ffn_norm.weightF32[3584]
-
blk.33.attn_k.weightQ4_K[3584 2048]
-
blk.33.attn_output.weightQ4_K[4096 3584]
-
blk.33.attn_q.weightQ4_K[3584 4096]
-
blk.33.attn_v.weightQ4_K[3584 2048]
-
blk.34.attn_norm.weightF32[3584]
-
blk.34.ffn_down.weightQ6_K[14336 3584]
-
blk.34.ffn_gate.weightQ4_K[3584 14336]
-
blk.34.ffn_up.weightQ4_K[3584 14336]
-
blk.34.post_attention_norm.weightF32[3584]
-
blk.34.post_ffw_norm.weightF32[3584]
-
blk.34.ffn_norm.weightF32[3584]
-
blk.34.attn_k.weightQ4_K[3584 2048]
-
blk.34.attn_output.weightQ4_K[4096 3584]
-
blk.34.attn_q.weightQ4_K[3584 4096]
-
blk.34.attn_v.weightQ6_K[3584 2048]
-
blk.35.attn_norm.weightF32[3584]
-
blk.35.ffn_down.weightQ4_K[14336 3584]
-
blk.35.ffn_gate.weightQ4_K[3584 14336]
-
blk.35.ffn_up.weightQ4_K[3584 14336]
-
blk.35.post_attention_norm.weightF32[3584]
-
blk.35.post_ffw_norm.weightF32[3584]
-
blk.35.ffn_norm.weightF32[3584]
-
blk.35.attn_k.weightQ4_K[3584 2048]
-
blk.35.attn_output.weightQ4_K[4096 3584]
-
blk.35.attn_q.weightQ4_K[3584 4096]
-
blk.35.attn_v.weightQ4_K[3584 2048]
-
blk.36.attn_norm.weightF32[3584]
-
blk.36.ffn_down.weightQ6_K[14336 3584]
-
blk.36.ffn_gate.weightQ4_K[3584 14336]
-
blk.36.ffn_up.weightQ4_K[3584 14336]
-
blk.36.post_attention_norm.weightF32[3584]
-
blk.36.post_ffw_norm.weightF32[3584]
-
blk.36.ffn_norm.weightF32[3584]
-
blk.36.attn_k.weightQ4_K[3584 2048]
-
blk.36.attn_output.weightQ4_K[4096 3584]
-
blk.36.attn_q.weightQ4_K[3584 4096]
-
blk.36.attn_v.weightQ6_K[3584 2048]
-
blk.37.attn_norm.weightF32[3584]
-
blk.37.ffn_down.weightQ6_K[14336 3584]
-
blk.37.ffn_gate.weightQ4_K[3584 14336]
-
blk.37.ffn_up.weightQ4_K[3584 14336]
-
blk.37.post_attention_norm.weightF32[3584]
-
blk.37.post_ffw_norm.weightF32[3584]
-
blk.37.ffn_norm.weightF32[3584]
-
blk.37.attn_k.weightQ4_K[3584 2048]
-
blk.37.attn_output.weightQ4_K[4096 3584]
-
blk.37.attn_q.weightQ4_K[3584 4096]
-
blk.37.attn_v.weightQ6_K[3584 2048]
-
blk.38.attn_norm.weightF32[3584]
-
blk.38.ffn_down.weightQ6_K[14336 3584]
-
blk.38.ffn_gate.weightQ4_K[3584 14336]
-
blk.38.ffn_up.weightQ4_K[3584 14336]
-
blk.38.post_attention_norm.weightF32[3584]
-
blk.38.post_ffw_norm.weightF32[3584]
-
blk.38.ffn_norm.weightF32[3584]
-
blk.38.attn_k.weightQ4_K[3584 2048]
-
blk.38.attn_output.weightQ4_K[4096 3584]
-
blk.38.attn_q.weightQ4_K[3584 4096]
-
blk.38.attn_v.weightQ6_K[3584 2048]
-
blk.39.attn_norm.weightF32[3584]
-
blk.39.ffn_down.weightQ6_K[14336 3584]
-
blk.39.ffn_gate.weightQ4_K[3584 14336]
-
blk.39.ffn_up.weightQ4_K[3584 14336]
-
blk.39.post_attention_norm.weightF32[3584]
-
blk.39.post_ffw_norm.weightF32[3584]
-
blk.39.ffn_norm.weightF32[3584]
-
blk.39.attn_k.weightQ4_K[3584 2048]
-
blk.39.attn_output.weightQ4_K[4096 3584]
-
blk.39.attn_q.weightQ4_K[3584 4096]
-
blk.39.attn_v.weightQ6_K[3584 2048]
-
blk.40.attn_norm.weightF32[3584]
-
blk.40.ffn_down.weightQ6_K[14336 3584]
-
blk.40.ffn_gate.weightQ4_K[3584 14336]
-
blk.40.ffn_up.weightQ4_K[3584 14336]
-
blk.40.post_attention_norm.weightF32[3584]
-
blk.40.post_ffw_norm.weightF32[3584]
-
blk.40.ffn_norm.weightF32[3584]
-
blk.40.attn_k.weightQ4_K[3584 2048]
-
blk.40.attn_output.weightQ4_K[4096 3584]
-
blk.40.attn_q.weightQ4_K[3584 4096]
-
blk.40.attn_v.weightQ6_K[3584 2048]
-
blk.41.attn_norm.weightF32[3584]
-
blk.41.ffn_down.weightQ6_K[14336 3584]
-
blk.41.ffn_gate.weightQ4_K[3584 14336]
-
blk.41.ffn_up.weightQ4_K[3584 14336]
-
blk.41.post_attention_norm.weightF32[3584]
-
blk.41.post_ffw_norm.weightF32[3584]
-
blk.41.ffn_norm.weightF32[3584]
-
blk.41.attn_k.weightQ4_K[3584 2048]
-
blk.41.attn_output.weightQ4_K[4096 3584]
-
blk.41.attn_q.weightQ4_K[3584 4096]
-
blk.41.attn_v.weightQ6_K[3584 2048]
-
output_norm.weightF32[3584]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41