27B
2 Pulls Updated 6 weeks ago
eb310a9bfb8b · 17GB
-
general.architecturegemma2
-
general.file_typeQ4_K_M
-
gemma2.attention.head_count32
-
gemma2.attention.head_count_kv16
-
gemma2.attention.key_length128
-
gemma2.attention.layer_norm_rms_epsilon1e-06
-
gemma2.attention.sliding_window4096
-
gemma2.attention.value_length128
-
gemma2.attn_logit_softcapping50
-
gemma2.block_count46
-
gemma2.context_length8192
-
gemma2.embedding_length4608
-
gemma2.feed_forward_length36864
-
gemma2.final_logit_softcapping30
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id2
-
tokenizer.ggml.eos_token_id1
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<pad> <eos> <bos> <unk> <mask> ...]
-
tokenizer.ggml.unknown_token_id3
-
NameTypeShape
-
token_embd.weightQ6_K[4608 256000]
-
blk.0.attn_k.weightQ4_K[4608 2048]
-
blk.0.attn_norm.weightF32[4608]
-
blk.0.attn_output.weightQ4_K[4096 4608]
-
blk.0.attn_q.weightQ4_K[4608 4096]
-
blk.0.attn_v.weightQ6_K[4608 2048]
-
blk.0.ffn_down.weightQ6_K[36864 4608]
-
blk.0.ffn_gate.weightQ4_K[4608 36864]
-
blk.0.ffn_norm.weightF32[4608]
-
blk.0.ffn_up.weightQ4_K[4608 36864]
-
blk.0.post_attention_norm.weightF32[4608]
-
blk.0.post_ffw_norm.weightF32[4608]
-
blk.1.attn_k.weightQ4_K[4608 2048]
-
blk.1.attn_norm.weightF32[4608]
-
blk.1.attn_output.weightQ4_K[4096 4608]
-
blk.1.attn_q.weightQ4_K[4608 4096]
-
blk.1.attn_v.weightQ6_K[4608 2048]
-
blk.1.ffn_down.weightQ6_K[36864 4608]
-
blk.1.ffn_gate.weightQ4_K[4608 36864]
-
blk.1.ffn_norm.weightF32[4608]
-
blk.1.ffn_up.weightQ4_K[4608 36864]
-
blk.1.post_attention_norm.weightF32[4608]
-
blk.1.post_ffw_norm.weightF32[4608]
-
blk.2.attn_k.weightQ4_K[4608 2048]
-
blk.2.attn_norm.weightF32[4608]
-
blk.2.attn_output.weightQ4_K[4096 4608]
-
blk.2.attn_q.weightQ4_K[4608 4096]
-
blk.2.attn_v.weightQ4_K[4608 2048]
-
blk.2.ffn_down.weightQ4_K[36864 4608]
-
blk.2.ffn_gate.weightQ4_K[4608 36864]
-
blk.2.ffn_norm.weightF32[4608]
-
blk.2.ffn_up.weightQ4_K[4608 36864]
-
blk.2.post_attention_norm.weightF32[4608]
-
blk.2.post_ffw_norm.weightF32[4608]
-
blk.3.attn_k.weightQ4_K[4608 2048]
-
blk.3.attn_norm.weightF32[4608]
-
blk.3.attn_output.weightQ4_K[4096 4608]
-
blk.3.attn_q.weightQ4_K[4608 4096]
-
blk.3.attn_v.weightQ4_K[4608 2048]
-
blk.3.ffn_down.weightQ4_K[36864 4608]
-
blk.3.ffn_gate.weightQ4_K[4608 36864]
-
blk.3.ffn_norm.weightF32[4608]
-
blk.3.ffn_up.weightQ4_K[4608 36864]
-
blk.3.post_attention_norm.weightF32[4608]
-
blk.3.post_ffw_norm.weightF32[4608]
-
blk.4.attn_k.weightQ4_K[4608 2048]
-
blk.4.attn_norm.weightF32[4608]
-
blk.4.attn_output.weightQ4_K[4096 4608]
-
blk.4.attn_q.weightQ4_K[4608 4096]
-
blk.4.attn_v.weightQ6_K[4608 2048]
-
blk.4.ffn_down.weightQ6_K[36864 4608]
-
blk.4.ffn_gate.weightQ4_K[4608 36864]
-
blk.4.ffn_norm.weightF32[4608]
-
blk.4.ffn_up.weightQ4_K[4608 36864]
-
blk.4.post_attention_norm.weightF32[4608]
-
blk.4.post_ffw_norm.weightF32[4608]
-
blk.5.attn_k.weightQ4_K[4608 2048]
-
blk.5.attn_norm.weightF32[4608]
-
blk.5.attn_output.weightQ4_K[4096 4608]
-
blk.5.attn_q.weightQ4_K[4608 4096]
-
blk.5.attn_v.weightQ6_K[4608 2048]
-
blk.5.ffn_down.weightQ6_K[36864 4608]
-
blk.5.ffn_gate.weightQ4_K[4608 36864]
-
blk.5.ffn_norm.weightF32[4608]
-
blk.5.ffn_up.weightQ4_K[4608 36864]
-
blk.5.post_attention_norm.weightF32[4608]
-
blk.5.post_ffw_norm.weightF32[4608]
-
blk.6.attn_k.weightQ4_K[4608 2048]
-
blk.6.attn_norm.weightF32[4608]
-
blk.6.attn_output.weightQ4_K[4096 4608]
-
blk.6.attn_q.weightQ4_K[4608 4096]
-
blk.6.attn_v.weightQ6_K[4608 2048]
-
blk.6.ffn_down.weightQ6_K[36864 4608]
-
blk.6.ffn_gate.weightQ4_K[4608 36864]
-
blk.6.ffn_norm.weightF32[4608]
-
blk.6.ffn_up.weightQ4_K[4608 36864]
-
blk.6.post_attention_norm.weightF32[4608]
-
blk.6.post_ffw_norm.weightF32[4608]
-
blk.7.attn_k.weightQ4_K[4608 2048]
-
blk.7.attn_norm.weightF32[4608]
-
blk.7.attn_output.weightQ4_K[4096 4608]
-
blk.7.attn_q.weightQ4_K[4608 4096]
-
blk.7.attn_v.weightQ6_K[4608 2048]
-
blk.7.ffn_down.weightQ6_K[36864 4608]
-
blk.7.ffn_gate.weightQ4_K[4608 36864]
-
blk.7.ffn_norm.weightF32[4608]
-
blk.7.ffn_up.weightQ4_K[4608 36864]
-
blk.7.post_attention_norm.weightF32[4608]
-
blk.7.post_ffw_norm.weightF32[4608]
-
blk.8.attn_k.weightQ4_K[4608 2048]
-
blk.8.attn_norm.weightF32[4608]
-
blk.8.attn_output.weightQ4_K[4096 4608]
-
blk.8.attn_q.weightQ4_K[4608 4096]
-
blk.8.attn_v.weightQ6_K[4608 2048]
-
blk.8.ffn_down.weightQ6_K[36864 4608]
-
blk.8.ffn_gate.weightQ4_K[4608 36864]
-
blk.8.ffn_norm.weightF32[4608]
-
blk.8.ffn_up.weightQ4_K[4608 36864]
-
blk.8.post_attention_norm.weightF32[4608]
-
blk.8.post_ffw_norm.weightF32[4608]
-
blk.9.attn_k.weightQ4_K[4608 2048]
-
blk.9.attn_norm.weightF32[4608]
-
blk.9.attn_output.weightQ4_K[4096 4608]
-
blk.9.attn_q.weightQ4_K[4608 4096]
-
blk.9.attn_v.weightQ6_K[4608 2048]
-
blk.9.ffn_down.weightQ6_K[36864 4608]
-
blk.9.ffn_gate.weightQ4_K[4608 36864]
-
blk.9.ffn_norm.weightF32[4608]
-
blk.9.ffn_up.weightQ4_K[4608 36864]
-
blk.9.post_attention_norm.weightF32[4608]
-
blk.9.post_ffw_norm.weightF32[4608]
-
blk.10.attn_k.weightQ4_K[4608 2048]
-
blk.10.attn_norm.weightF32[4608]
-
blk.10.attn_output.weightQ4_K[4096 4608]
-
blk.10.attn_q.weightQ4_K[4608 4096]
-
blk.10.attn_v.weightQ6_K[4608 2048]
-
blk.10.ffn_down.weightQ6_K[36864 4608]
-
blk.10.ffn_gate.weightQ4_K[4608 36864]
-
blk.10.ffn_norm.weightF32[4608]
-
blk.10.ffn_up.weightQ4_K[4608 36864]
-
blk.10.post_attention_norm.weightF32[4608]
-
blk.10.post_ffw_norm.weightF32[4608]
-
blk.11.attn_k.weightQ4_K[4608 2048]
-
blk.11.attn_norm.weightF32[4608]
-
blk.11.attn_output.weightQ4_K[4096 4608]
-
blk.11.attn_q.weightQ4_K[4608 4096]
-
blk.11.attn_v.weightQ6_K[4608 2048]
-
blk.11.ffn_down.weightQ6_K[36864 4608]
-
blk.11.ffn_gate.weightQ4_K[4608 36864]
-
blk.11.ffn_norm.weightF32[4608]
-
blk.11.ffn_up.weightQ4_K[4608 36864]
-
blk.11.post_attention_norm.weightF32[4608]
-
blk.11.post_ffw_norm.weightF32[4608]
-
blk.12.attn_k.weightQ4_K[4608 2048]
-
blk.12.attn_norm.weightF32[4608]
-
blk.12.attn_output.weightQ4_K[4096 4608]
-
blk.12.attn_q.weightQ4_K[4608 4096]
-
blk.12.attn_v.weightQ6_K[4608 2048]
-
blk.12.ffn_down.weightQ6_K[36864 4608]
-
blk.12.ffn_gate.weightQ4_K[4608 36864]
-
blk.12.ffn_norm.weightF32[4608]
-
blk.12.ffn_up.weightQ4_K[4608 36864]
-
blk.12.post_attention_norm.weightF32[4608]
-
blk.12.post_ffw_norm.weightF32[4608]
-
blk.13.attn_k.weightQ4_K[4608 2048]
-
blk.13.attn_norm.weightF32[4608]
-
blk.13.attn_output.weightQ4_K[4096 4608]
-
blk.13.attn_q.weightQ4_K[4608 4096]
-
blk.13.attn_v.weightQ4_K[4608 2048]
-
blk.13.ffn_down.weightQ4_K[36864 4608]
-
blk.13.ffn_gate.weightQ4_K[4608 36864]
-
blk.13.ffn_norm.weightF32[4608]
-
blk.13.ffn_up.weightQ4_K[4608 36864]
-
blk.13.post_attention_norm.weightF32[4608]
-
blk.13.post_ffw_norm.weightF32[4608]
-
blk.14.attn_k.weightQ4_K[4608 2048]
-
blk.14.attn_norm.weightF32[4608]
-
blk.14.attn_output.weightQ4_K[4096 4608]
-
blk.14.attn_q.weightQ4_K[4608 4096]
-
blk.14.attn_v.weightQ4_K[4608 2048]
-
blk.14.ffn_down.weightQ4_K[36864 4608]
-
blk.14.ffn_gate.weightQ4_K[4608 36864]
-
blk.14.ffn_norm.weightF32[4608]
-
blk.14.ffn_up.weightQ4_K[4608 36864]
-
blk.14.post_attention_norm.weightF32[4608]
-
blk.14.post_ffw_norm.weightF32[4608]
-
blk.15.attn_k.weightQ4_K[4608 2048]
-
blk.15.attn_norm.weightF32[4608]
-
blk.15.attn_output.weightQ4_K[4096 4608]
-
blk.15.attn_q.weightQ4_K[4608 4096]
-
blk.15.attn_v.weightQ6_K[4608 2048]
-
blk.15.ffn_down.weightQ6_K[36864 4608]
-
blk.15.ffn_gate.weightQ4_K[4608 36864]
-
blk.15.ffn_norm.weightF32[4608]
-
blk.15.ffn_up.weightQ4_K[4608 36864]
-
blk.15.post_attention_norm.weightF32[4608]
-
blk.15.post_ffw_norm.weightF32[4608]
-
blk.16.attn_k.weightQ4_K[4608 2048]
-
blk.16.attn_norm.weightF32[4608]
-
blk.16.attn_output.weightQ4_K[4096 4608]
-
blk.16.attn_q.weightQ4_K[4608 4096]
-
blk.16.attn_v.weightQ4_K[4608 2048]
-
blk.16.ffn_down.weightQ4_K[36864 4608]
-
blk.16.ffn_gate.weightQ4_K[4608 36864]
-
blk.16.ffn_norm.weightF32[4608]
-
blk.16.ffn_up.weightQ4_K[4608 36864]
-
blk.16.post_attention_norm.weightF32[4608]
-
blk.16.post_ffw_norm.weightF32[4608]
-
blk.17.attn_k.weightQ4_K[4608 2048]
-
blk.17.attn_norm.weightF32[4608]
-
blk.17.attn_output.weightQ4_K[4096 4608]
-
blk.17.attn_q.weightQ4_K[4608 4096]
-
blk.17.attn_v.weightQ4_K[4608 2048]
-
blk.17.ffn_down.weightQ4_K[36864 4608]
-
blk.17.ffn_gate.weightQ4_K[4608 36864]
-
blk.17.ffn_norm.weightF32[4608]
-
blk.17.ffn_up.weightQ4_K[4608 36864]
-
blk.17.post_attention_norm.weightF32[4608]
-
blk.17.post_ffw_norm.weightF32[4608]
-
blk.18.attn_k.weightQ4_K[4608 2048]
-
blk.18.attn_norm.weightF32[4608]
-
blk.18.attn_output.weightQ4_K[4096 4608]
-
blk.18.attn_q.weightQ4_K[4608 4096]
-
blk.18.attn_v.weightQ6_K[4608 2048]
-
blk.18.ffn_down.weightQ6_K[36864 4608]
-
blk.18.ffn_gate.weightQ4_K[4608 36864]
-
blk.18.ffn_norm.weightF32[4608]
-
blk.18.ffn_up.weightQ4_K[4608 36864]
-
blk.18.post_attention_norm.weightF32[4608]
-
blk.18.post_ffw_norm.weightF32[4608]
-
blk.19.attn_k.weightQ4_K[4608 2048]
-
blk.19.attn_norm.weightF32[4608]
-
blk.19.attn_output.weightQ4_K[4096 4608]
-
blk.19.attn_q.weightQ4_K[4608 4096]
-
blk.19.attn_v.weightQ4_K[4608 2048]
-
blk.19.ffn_down.weightQ4_K[36864 4608]
-
blk.19.ffn_gate.weightQ4_K[4608 36864]
-
blk.19.ffn_norm.weightF32[4608]
-
blk.19.ffn_up.weightQ4_K[4608 36864]
-
blk.19.post_attention_norm.weightF32[4608]
-
blk.19.post_ffw_norm.weightF32[4608]
-
blk.20.attn_k.weightQ4_K[4608 2048]
-
blk.20.attn_norm.weightF32[4608]
-
blk.20.attn_output.weightQ4_K[4096 4608]
-
blk.20.attn_q.weightQ4_K[4608 4096]
-
blk.20.attn_v.weightQ6_K[4608 2048]
-
blk.20.ffn_down.weightQ6_K[36864 4608]
-
blk.20.ffn_gate.weightQ4_K[4608 36864]
-
blk.20.ffn_norm.weightF32[4608]
-
blk.20.ffn_up.weightQ4_K[4608 36864]
-
blk.20.post_attention_norm.weightF32[4608]
-
blk.20.post_ffw_norm.weightF32[4608]
-
blk.21.attn_k.weightQ4_K[4608 2048]
-
blk.21.attn_norm.weightF32[4608]
-
blk.21.attn_output.weightQ4_K[4096 4608]
-
blk.21.attn_q.weightQ4_K[4608 4096]
-
blk.21.attn_v.weightQ4_K[4608 2048]
-
blk.21.ffn_down.weightQ4_K[36864 4608]
-
blk.21.ffn_gate.weightQ4_K[4608 36864]
-
blk.21.ffn_norm.weightF32[4608]
-
blk.21.ffn_up.weightQ4_K[4608 36864]
-
blk.21.post_attention_norm.weightF32[4608]
-
blk.21.post_ffw_norm.weightF32[4608]
-
blk.22.attn_k.weightQ4_K[4608 2048]
-
blk.22.attn_norm.weightF32[4608]
-
blk.22.attn_output.weightQ4_K[4096 4608]
-
blk.22.attn_q.weightQ4_K[4608 4096]
-
blk.22.attn_v.weightQ4_K[4608 2048]
-
blk.22.ffn_down.weightQ4_K[36864 4608]
-
blk.22.ffn_gate.weightQ4_K[4608 36864]
-
blk.22.ffn_norm.weightF32[4608]
-
blk.22.ffn_up.weightQ4_K[4608 36864]
-
blk.22.post_attention_norm.weightF32[4608]
-
blk.22.post_ffw_norm.weightF32[4608]
-
blk.23.attn_k.weightQ4_K[4608 2048]
-
blk.23.attn_norm.weightF32[4608]
-
blk.23.attn_output.weightQ4_K[4096 4608]
-
blk.23.attn_q.weightQ4_K[4608 4096]
-
blk.23.attn_v.weightQ6_K[4608 2048]
-
blk.23.ffn_down.weightQ6_K[36864 4608]
-
blk.23.ffn_gate.weightQ4_K[4608 36864]
-
blk.23.ffn_norm.weightF32[4608]
-
blk.23.ffn_up.weightQ4_K[4608 36864]
-
blk.23.post_attention_norm.weightF32[4608]
-
blk.23.post_ffw_norm.weightF32[4608]
-
blk.24.attn_k.weightQ4_K[4608 2048]
-
blk.24.attn_norm.weightF32[4608]
-
blk.24.attn_output.weightQ4_K[4096 4608]
-
blk.24.attn_q.weightQ4_K[4608 4096]
-
blk.24.attn_v.weightQ4_K[4608 2048]
-
blk.24.ffn_down.weightQ4_K[36864 4608]
-
blk.24.ffn_gate.weightQ4_K[4608 36864]
-
blk.24.ffn_norm.weightF32[4608]
-
blk.24.ffn_up.weightQ4_K[4608 36864]
-
blk.24.post_attention_norm.weightF32[4608]
-
blk.24.post_ffw_norm.weightF32[4608]
-
blk.25.attn_k.weightQ4_K[4608 2048]
-
blk.25.attn_norm.weightF32[4608]
-
blk.25.attn_output.weightQ4_K[4096 4608]
-
blk.25.attn_q.weightQ4_K[4608 4096]
-
blk.25.attn_v.weightQ4_K[4608 2048]
-
blk.25.ffn_down.weightQ4_K[36864 4608]
-
blk.25.ffn_gate.weightQ4_K[4608 36864]
-
blk.25.ffn_norm.weightF32[4608]
-
blk.25.ffn_up.weightQ4_K[4608 36864]
-
blk.25.post_attention_norm.weightF32[4608]
-
blk.25.post_ffw_norm.weightF32[4608]
-
blk.26.attn_k.weightQ4_K[4608 2048]
-
blk.26.attn_norm.weightF32[4608]
-
blk.26.attn_output.weightQ4_K[4096 4608]
-
blk.26.attn_q.weightQ4_K[4608 4096]
-
blk.26.attn_v.weightQ6_K[4608 2048]
-
blk.26.ffn_down.weightQ6_K[36864 4608]
-
blk.26.ffn_gate.weightQ4_K[4608 36864]
-
blk.26.ffn_norm.weightF32[4608]
-
blk.26.ffn_up.weightQ4_K[4608 36864]
-
blk.26.post_attention_norm.weightF32[4608]
-
blk.26.post_ffw_norm.weightF32[4608]
-
blk.27.attn_k.weightQ4_K[4608 2048]
-
blk.27.attn_norm.weightF32[4608]
-
blk.27.attn_output.weightQ4_K[4096 4608]
-
blk.27.attn_q.weightQ4_K[4608 4096]
-
blk.27.attn_v.weightQ4_K[4608 2048]
-
blk.27.ffn_down.weightQ4_K[36864 4608]
-
blk.27.ffn_gate.weightQ4_K[4608 36864]
-
blk.27.ffn_norm.weightF32[4608]
-
blk.27.ffn_up.weightQ4_K[4608 36864]
-
blk.27.post_attention_norm.weightF32[4608]
-
blk.27.post_ffw_norm.weightF32[4608]
-
blk.28.attn_k.weightQ4_K[4608 2048]
-
blk.28.attn_norm.weightF32[4608]
-
blk.28.attn_output.weightQ4_K[4096 4608]
-
blk.28.attn_q.weightQ4_K[4608 4096]
-
blk.28.attn_v.weightQ4_K[4608 2048]
-
blk.28.ffn_down.weightQ4_K[36864 4608]
-
blk.28.ffn_gate.weightQ4_K[4608 36864]
-
blk.28.ffn_norm.weightF32[4608]
-
blk.28.ffn_up.weightQ4_K[4608 36864]
-
blk.28.post_attention_norm.weightF32[4608]
-
blk.28.post_ffw_norm.weightF32[4608]
-
blk.29.attn_k.weightQ4_K[4608 2048]
-
blk.29.attn_norm.weightF32[4608]
-
blk.29.attn_output.weightQ4_K[4096 4608]
-
blk.29.attn_q.weightQ4_K[4608 4096]
-
blk.29.attn_v.weightQ6_K[4608 2048]
-
blk.29.ffn_down.weightQ6_K[36864 4608]
-
blk.29.ffn_gate.weightQ4_K[4608 36864]
-
blk.29.ffn_norm.weightF32[4608]
-
blk.29.ffn_up.weightQ4_K[4608 36864]
-
blk.29.post_attention_norm.weightF32[4608]
-
blk.29.post_ffw_norm.weightF32[4608]
-
blk.30.attn_k.weightQ4_K[4608 2048]
-
blk.30.attn_norm.weightF32[4608]
-
blk.30.attn_output.weightQ4_K[4096 4608]
-
blk.30.attn_q.weightQ4_K[4608 4096]
-
blk.30.attn_v.weightQ4_K[4608 2048]
-
blk.30.ffn_down.weightQ4_K[36864 4608]
-
blk.30.ffn_gate.weightQ4_K[4608 36864]
-
blk.30.ffn_norm.weightF32[4608]
-
blk.30.ffn_up.weightQ4_K[4608 36864]
-
blk.30.post_attention_norm.weightF32[4608]
-
blk.30.post_ffw_norm.weightF32[4608]
-
blk.31.attn_k.weightQ4_K[4608 2048]
-
blk.31.attn_norm.weightF32[4608]
-
blk.31.attn_output.weightQ4_K[4096 4608]
-
blk.31.attn_q.weightQ4_K[4608 4096]
-
blk.31.attn_v.weightQ6_K[4608 2048]
-
blk.31.ffn_down.weightQ6_K[36864 4608]
-
blk.31.ffn_gate.weightQ4_K[4608 36864]
-
blk.31.ffn_norm.weightF32[4608]
-
blk.31.ffn_up.weightQ4_K[4608 36864]
-
blk.31.post_attention_norm.weightF32[4608]
-
blk.31.post_ffw_norm.weightF32[4608]
-
blk.32.attn_k.weightQ4_K[4608 2048]
-
blk.32.attn_norm.weightF32[4608]
-
blk.32.attn_output.weightQ4_K[4096 4608]
-
blk.32.attn_q.weightQ4_K[4608 4096]
-
blk.32.attn_v.weightQ4_K[4608 2048]
-
blk.32.ffn_down.weightQ4_K[36864 4608]
-
blk.32.ffn_gate.weightQ4_K[4608 36864]
-
blk.32.ffn_norm.weightF32[4608]
-
blk.32.ffn_up.weightQ4_K[4608 36864]
-
blk.32.post_attention_norm.weightF32[4608]
-
blk.32.post_ffw_norm.weightF32[4608]
-
blk.33.attn_k.weightQ4_K[4608 2048]
-
blk.33.attn_norm.weightF32[4608]
-
blk.33.attn_output.weightQ4_K[4096 4608]
-
blk.33.attn_q.weightQ4_K[4608 4096]
-
blk.33.attn_v.weightQ4_K[4608 2048]
-
blk.33.ffn_down.weightQ4_K[36864 4608]
-
blk.33.ffn_gate.weightQ4_K[4608 36864]
-
blk.33.ffn_norm.weightF32[4608]
-
blk.33.ffn_up.weightQ4_K[4608 36864]
-
blk.33.post_attention_norm.weightF32[4608]
-
blk.33.post_ffw_norm.weightF32[4608]
-
blk.34.attn_k.weightQ4_K[4608 2048]
-
blk.34.attn_norm.weightF32[4608]
-
blk.34.attn_output.weightQ4_K[4096 4608]
-
blk.34.attn_q.weightQ4_K[4608 4096]
-
blk.34.attn_v.weightQ6_K[4608 2048]
-
blk.34.ffn_down.weightQ6_K[36864 4608]
-
blk.34.ffn_gate.weightQ4_K[4608 36864]
-
blk.34.ffn_norm.weightF32[4608]
-
blk.34.ffn_up.weightQ4_K[4608 36864]
-
blk.34.post_attention_norm.weightF32[4608]
-
blk.34.post_ffw_norm.weightF32[4608]
-
blk.35.attn_k.weightQ4_K[4608 2048]
-
blk.35.attn_norm.weightF32[4608]
-
blk.35.attn_output.weightQ4_K[4096 4608]
-
blk.35.attn_q.weightQ4_K[4608 4096]
-
blk.35.attn_v.weightQ4_K[4608 2048]
-
blk.35.ffn_down.weightQ4_K[36864 4608]
-
blk.35.ffn_gate.weightQ4_K[4608 36864]
-
blk.35.ffn_norm.weightF32[4608]
-
blk.35.ffn_up.weightQ4_K[4608 36864]
-
blk.35.post_attention_norm.weightF32[4608]
-
blk.35.post_ffw_norm.weightF32[4608]
-
blk.36.attn_k.weightQ4_K[4608 2048]
-
blk.36.attn_norm.weightF32[4608]
-
blk.36.attn_output.weightQ4_K[4096 4608]
-
blk.36.attn_q.weightQ4_K[4608 4096]
-
blk.36.attn_v.weightQ4_K[4608 2048]
-
blk.36.ffn_down.weightQ4_K[36864 4608]
-
blk.36.ffn_gate.weightQ4_K[4608 36864]
-
blk.36.ffn_norm.weightF32[4608]
-
blk.36.ffn_up.weightQ4_K[4608 36864]
-
blk.36.post_attention_norm.weightF32[4608]
-
blk.36.post_ffw_norm.weightF32[4608]
-
blk.37.attn_k.weightQ4_K[4608 2048]
-
blk.37.attn_norm.weightF32[4608]
-
blk.37.attn_output.weightQ4_K[4096 4608]
-
blk.37.attn_q.weightQ4_K[4608 4096]
-
blk.37.attn_v.weightQ6_K[4608 2048]
-
blk.37.ffn_down.weightQ6_K[36864 4608]
-
blk.37.ffn_gate.weightQ4_K[4608 36864]
-
blk.37.ffn_norm.weightF32[4608]
-
blk.37.ffn_up.weightQ4_K[4608 36864]
-
blk.37.post_attention_norm.weightF32[4608]
-
blk.37.post_ffw_norm.weightF32[4608]
-
blk.38.attn_k.weightQ4_K[4608 2048]
-
blk.38.attn_norm.weightF32[4608]
-
blk.38.attn_output.weightQ4_K[4096 4608]
-
blk.38.attn_q.weightQ4_K[4608 4096]
-
blk.38.attn_v.weightQ4_K[4608 2048]
-
blk.38.ffn_down.weightQ4_K[36864 4608]
-
blk.38.ffn_gate.weightQ4_K[4608 36864]
-
blk.38.ffn_norm.weightF32[4608]
-
blk.38.ffn_up.weightQ4_K[4608 36864]
-
blk.38.post_attention_norm.weightF32[4608]
-
blk.38.post_ffw_norm.weightF32[4608]
-
blk.39.attn_k.weightQ4_K[4608 2048]
-
blk.39.attn_norm.weightF32[4608]
-
blk.39.attn_output.weightQ4_K[4096 4608]
-
blk.39.attn_q.weightQ4_K[4608 4096]
-
blk.39.attn_v.weightQ4_K[4608 2048]
-
blk.39.ffn_down.weightQ4_K[36864 4608]
-
blk.39.ffn_gate.weightQ4_K[4608 36864]
-
blk.39.ffn_norm.weightF32[4608]
-
blk.39.ffn_up.weightQ4_K[4608 36864]
-
blk.39.post_attention_norm.weightF32[4608]
-
blk.39.post_ffw_norm.weightF32[4608]
-
blk.40.attn_k.weightQ4_K[4608 2048]
-
blk.40.attn_norm.weightF32[4608]
-
blk.40.attn_output.weightQ4_K[4096 4608]
-
blk.40.attn_q.weightQ4_K[4608 4096]
-
blk.40.attn_v.weightQ4_K[4608 2048]
-
blk.40.ffn_down.weightQ4_K[36864 4608]
-
blk.40.ffn_gate.weightQ4_K[4608 36864]
-
blk.40.ffn_norm.weightF32[4608]
-
blk.40.ffn_up.weightQ4_K[4608 36864]
-
blk.40.post_attention_norm.weightF32[4608]
-
blk.40.post_ffw_norm.weightF32[4608]
-
blk.41.attn_k.weightQ4_K[4608 2048]
-
blk.41.attn_norm.weightF32[4608]
-
blk.41.attn_output.weightQ4_K[4096 4608]
-
blk.41.attn_q.weightQ4_K[4608 4096]
-
blk.41.attn_v.weightQ4_K[4608 2048]
-
blk.41.ffn_down.weightQ4_K[36864 4608]
-
blk.41.ffn_gate.weightQ4_K[4608 36864]
-
blk.41.ffn_norm.weightF32[4608]
-
blk.41.ffn_up.weightQ4_K[4608 36864]
-
blk.41.post_attention_norm.weightF32[4608]
-
blk.41.post_ffw_norm.weightF32[4608]
-
blk.42.attn_k.weightQ4_K[4608 2048]
-
blk.42.attn_norm.weightF32[4608]
-
blk.42.attn_output.weightQ4_K[4096 4608]
-
blk.42.attn_q.weightQ4_K[4608 4096]
-
blk.42.attn_v.weightQ6_K[4608 2048]
-
blk.42.ffn_down.weightQ6_K[36864 4608]
-
blk.42.ffn_gate.weightQ4_K[4608 36864]
-
blk.42.ffn_norm.weightF32[4608]
-
blk.42.ffn_up.weightQ4_K[4608 36864]
-
blk.42.post_attention_norm.weightF32[4608]
-
blk.42.post_ffw_norm.weightF32[4608]
-
blk.43.attn_k.weightQ4_K[4608 2048]
-
blk.43.attn_norm.weightF32[4608]
-
blk.43.attn_output.weightQ4_K[4096 4608]
-
blk.43.attn_q.weightQ4_K[4608 4096]
-
blk.43.attn_v.weightQ4_K[4608 2048]
-
blk.43.ffn_down.weightQ4_K[36864 4608]
-
blk.43.ffn_gate.weightQ4_K[4608 36864]
-
blk.43.ffn_norm.weightF32[4608]
-
blk.43.ffn_up.weightQ4_K[4608 36864]
-
blk.43.post_attention_norm.weightF32[4608]
-
blk.43.post_ffw_norm.weightF32[4608]
-
blk.44.attn_k.weightQ4_K[4608 2048]
-
blk.44.attn_norm.weightF32[4608]
-
blk.44.attn_output.weightQ4_K[4096 4608]
-
blk.44.attn_q.weightQ4_K[4608 4096]
-
blk.44.attn_v.weightQ4_K[4608 2048]
-
blk.44.ffn_down.weightQ4_K[36864 4608]
-
blk.44.ffn_gate.weightQ4_K[4608 36864]
-
blk.44.ffn_norm.weightF32[4608]
-
blk.44.ffn_up.weightQ4_K[4608 36864]
-
blk.44.post_attention_norm.weightF32[4608]
-
blk.44.post_ffw_norm.weightF32[4608]
-
blk.45.attn_k.weightQ4_K[4608 2048]
-
blk.45.attn_norm.weightF32[4608]
-
blk.45.attn_output.weightQ4_K[4096 4608]
-
blk.45.attn_q.weightQ4_K[4608 4096]
-
blk.45.attn_v.weightQ6_K[4608 2048]
-
blk.45.ffn_down.weightQ6_K[36864 4608]
-
blk.45.ffn_gate.weightQ4_K[4608 36864]
-
blk.45.ffn_norm.weightF32[4608]
-
blk.45.ffn_up.weightQ4_K[4608 36864]
-
blk.45.post_attention_norm.weightF32[4608]
-
blk.45.post_ffw_norm.weightF32[4608]
-
output_norm.weightF32[4608]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45