latest
17GB
google/gemma-2-27b-it Korean q4 model with CPT->SFT->DPO
27B
6 Pulls Updated 13 days ago
0fb76fdd8025 · 17GB
-
general.architecturegemma2
-
general.file_typeQ4_K_M
-
gemma2.attention.head_count32
-
gemma2.attention.head_count_kv16
-
gemma2.attention.key_length128
-
gemma2.attention.layer_norm_rms_epsilon1e-06
-
gemma2.attention.sliding_window4096
-
gemma2.attention.value_length128
-
gemma2.attn_logit_softcapping50
-
gemma2.block_count46
-
gemma2.context_length8192
-
gemma2.embedding_length4608
-
gemma2.feed_forward_length36864
-
gemma2.final_logit_softcapping30
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id2
-
tokenizer.ggml.eos_token_id1
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id1
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<pad> <eos> <bos> <unk> <mask> ...]
-
tokenizer.ggml.unknown_token_id3
-
NameTypeShape
-
token_embd.weightQ6_K[4608 256000]
-
blk.0.attn_norm.weightF32[4608]
-
blk.0.ffn_down.weightQ6_K[36864 4608]
-
blk.0.ffn_gate.weightQ4_K[4608 36864]
-
blk.0.ffn_up.weightQ4_K[4608 36864]
-
blk.0.post_attention_norm.weightF32[4608]
-
blk.0.post_ffw_norm.weightF32[4608]
-
blk.0.ffn_norm.weightF32[4608]
-
blk.0.attn_k.weightQ4_K[4608 2048]
-
blk.0.attn_output.weightQ4_K[4096 4608]
-
blk.0.attn_q.weightQ4_K[4608 4096]
-
blk.0.attn_v.weightQ6_K[4608 2048]
-
blk.1.attn_norm.weightF32[4608]
-
blk.1.ffn_down.weightQ6_K[36864 4608]
-
blk.1.ffn_gate.weightQ4_K[4608 36864]
-
blk.1.ffn_up.weightQ4_K[4608 36864]
-
blk.1.post_attention_norm.weightF32[4608]
-
blk.1.post_ffw_norm.weightF32[4608]
-
blk.1.ffn_norm.weightF32[4608]
-
blk.1.attn_k.weightQ4_K[4608 2048]
-
blk.1.attn_output.weightQ4_K[4096 4608]
-
blk.1.attn_q.weightQ4_K[4608 4096]
-
blk.1.attn_v.weightQ6_K[4608 2048]
-
blk.2.attn_k.weightQ4_K[4608 2048]
-
blk.2.attn_output.weightQ4_K[4096 4608]
-
blk.2.attn_q.weightQ4_K[4608 4096]
-
blk.2.attn_v.weightQ6_K[4608 2048]
-
blk.2.attn_norm.weightF32[4608]
-
blk.2.ffn_down.weightQ6_K[36864 4608]
-
blk.2.ffn_gate.weightQ4_K[4608 36864]
-
blk.2.ffn_up.weightQ4_K[4608 36864]
-
blk.2.post_attention_norm.weightF32[4608]
-
blk.2.post_ffw_norm.weightF32[4608]
-
blk.2.ffn_norm.weightF32[4608]
-
blk.3.attn_norm.weightF32[4608]
-
blk.3.ffn_down.weightQ6_K[36864 4608]
-
blk.3.ffn_gate.weightQ4_K[4608 36864]
-
blk.3.ffn_up.weightQ4_K[4608 36864]
-
blk.3.post_attention_norm.weightF32[4608]
-
blk.3.post_ffw_norm.weightF32[4608]
-
blk.3.ffn_norm.weightF32[4608]
-
blk.3.attn_k.weightQ4_K[4608 2048]
-
blk.3.attn_output.weightQ4_K[4096 4608]
-
blk.3.attn_q.weightQ4_K[4608 4096]
-
blk.3.attn_v.weightQ6_K[4608 2048]
-
blk.4.attn_norm.weightF32[4608]
-
blk.4.ffn_down.weightQ6_K[36864 4608]
-
blk.4.ffn_gate.weightQ4_K[4608 36864]
-
blk.4.ffn_up.weightQ4_K[4608 36864]
-
blk.4.post_attention_norm.weightF32[4608]
-
blk.4.post_ffw_norm.weightF32[4608]
-
blk.4.ffn_norm.weightF32[4608]
-
blk.4.attn_k.weightQ4_K[4608 2048]
-
blk.4.attn_output.weightQ4_K[4096 4608]
-
blk.4.attn_q.weightQ4_K[4608 4096]
-
blk.4.attn_v.weightQ6_K[4608 2048]
-
blk.5.attn_norm.weightF32[4608]
-
blk.5.ffn_down.weightQ4_K[36864 4608]
-
blk.5.ffn_gate.weightQ4_K[4608 36864]
-
blk.5.ffn_up.weightQ4_K[4608 36864]
-
blk.5.post_attention_norm.weightF32[4608]
-
blk.5.post_ffw_norm.weightF32[4608]
-
blk.5.ffn_norm.weightF32[4608]
-
blk.5.attn_k.weightQ4_K[4608 2048]
-
blk.5.attn_output.weightQ4_K[4096 4608]
-
blk.5.attn_q.weightQ4_K[4608 4096]
-
blk.5.attn_v.weightQ4_K[4608 2048]
-
blk.6.ffn_gate.weightQ4_K[4608 36864]
-
blk.6.attn_k.weightQ4_K[4608 2048]
-
blk.6.attn_output.weightQ4_K[4096 4608]
-
blk.6.attn_q.weightQ4_K[4608 4096]
-
blk.6.attn_v.weightQ4_K[4608 2048]
-
blk.6.attn_norm.weightF32[4608]
-
blk.6.ffn_down.weightQ4_K[36864 4608]
-
blk.6.ffn_up.weightQ4_K[4608 36864]
-
blk.6.post_attention_norm.weightF32[4608]
-
blk.6.post_ffw_norm.weightF32[4608]
-
blk.6.ffn_norm.weightF32[4608]
-
blk.7.attn_norm.weightF32[4608]
-
blk.7.ffn_down.weightQ6_K[36864 4608]
-
blk.7.ffn_gate.weightQ4_K[4608 36864]
-
blk.7.ffn_up.weightQ4_K[4608 36864]
-
blk.7.post_attention_norm.weightF32[4608]
-
blk.7.post_ffw_norm.weightF32[4608]
-
blk.7.ffn_norm.weightF32[4608]
-
blk.7.attn_k.weightQ4_K[4608 2048]
-
blk.7.attn_output.weightQ4_K[4096 4608]
-
blk.7.attn_q.weightQ4_K[4608 4096]
-
blk.7.attn_v.weightQ4_K[4608 2048]
-
blk.8.attn_norm.weightF32[4608]
-
blk.8.ffn_down.weightQ4_K[36864 4608]
-
blk.8.ffn_gate.weightQ4_K[4608 36864]
-
blk.8.ffn_up.weightQ4_K[4608 36864]
-
blk.8.post_attention_norm.weightF32[4608]
-
blk.8.post_ffw_norm.weightF32[4608]
-
blk.8.ffn_norm.weightF32[4608]
-
blk.8.attn_k.weightQ4_K[4608 2048]
-
blk.8.attn_output.weightQ4_K[4096 4608]
-
blk.8.attn_q.weightQ4_K[4608 4096]
-
blk.8.attn_v.weightQ4_K[4608 2048]
-
blk.9.attn_norm.weightF32[4608]
-
blk.9.ffn_down.weightQ4_K[36864 4608]
-
blk.9.ffn_gate.weightQ4_K[4608 36864]
-
blk.9.ffn_up.weightQ4_K[4608 36864]
-
blk.9.post_attention_norm.weightF32[4608]
-
blk.9.post_ffw_norm.weightF32[4608]
-
blk.9.ffn_norm.weightF32[4608]
-
blk.9.attn_k.weightQ4_K[4608 2048]
-
blk.9.attn_output.weightQ4_K[4096 4608]
-
blk.9.attn_q.weightQ4_K[4608 4096]
-
blk.9.attn_v.weightQ6_K[4608 2048]
-
blk.10.ffn_gate.weightQ4_K[4608 36864]
-
blk.10.ffn_up.weightQ4_K[4608 36864]
-
blk.10.attn_k.weightQ4_K[4608 2048]
-
blk.10.attn_output.weightQ4_K[4096 4608]
-
blk.10.attn_q.weightQ4_K[4608 4096]
-
blk.10.attn_v.weightQ6_K[4608 2048]
-
blk.10.attn_norm.weightF32[4608]
-
blk.10.ffn_down.weightQ6_K[36864 4608]
-
blk.10.post_attention_norm.weightF32[4608]
-
blk.10.post_ffw_norm.weightF32[4608]
-
blk.10.ffn_norm.weightF32[4608]
-
blk.11.attn_norm.weightF32[4608]
-
blk.11.ffn_down.weightQ4_K[36864 4608]
-
blk.11.ffn_gate.weightQ4_K[4608 36864]
-
blk.11.ffn_up.weightQ4_K[4608 36864]
-
blk.11.post_attention_norm.weightF32[4608]
-
blk.11.post_ffw_norm.weightF32[4608]
-
blk.11.ffn_norm.weightF32[4608]
-
blk.11.attn_k.weightQ4_K[4608 2048]
-
blk.11.attn_output.weightQ4_K[4096 4608]
-
blk.11.attn_q.weightQ4_K[4608 4096]
-
blk.11.attn_v.weightQ4_K[4608 2048]
-
blk.12.attn_norm.weightF32[4608]
-
blk.12.ffn_down.weightQ4_K[36864 4608]
-
blk.12.ffn_gate.weightQ4_K[4608 36864]
-
blk.12.ffn_up.weightQ4_K[4608 36864]
-
blk.12.post_attention_norm.weightF32[4608]
-
blk.12.post_ffw_norm.weightF32[4608]
-
blk.12.ffn_norm.weightF32[4608]
-
blk.12.attn_k.weightQ4_K[4608 2048]
-
blk.12.attn_output.weightQ4_K[4096 4608]
-
blk.12.attn_q.weightQ4_K[4608 4096]
-
blk.12.attn_v.weightQ4_K[4608 2048]
-
blk.13.attn_norm.weightF32[4608]
-
blk.13.ffn_down.weightQ6_K[36864 4608]
-
blk.13.ffn_gate.weightQ4_K[4608 36864]
-
blk.13.ffn_up.weightQ4_K[4608 36864]
-
blk.13.post_attention_norm.weightF32[4608]
-
blk.13.post_ffw_norm.weightF32[4608]
-
blk.13.ffn_norm.weightF32[4608]
-
blk.13.attn_k.weightQ4_K[4608 2048]
-
blk.13.attn_output.weightQ4_K[4096 4608]
-
blk.13.attn_q.weightQ4_K[4608 4096]
-
blk.13.attn_v.weightQ6_K[4608 2048]
-
blk.14.attn_norm.weightF32[4608]
-
blk.14.ffn_down.weightQ4_K[36864 4608]
-
blk.14.ffn_gate.weightQ4_K[4608 36864]
-
blk.14.ffn_up.weightQ4_K[4608 36864]
-
blk.14.post_attention_norm.weightF32[4608]
-
blk.14.post_ffw_norm.weightF32[4608]
-
blk.14.ffn_norm.weightF32[4608]
-
blk.14.attn_k.weightQ4_K[4608 2048]
-
blk.14.attn_output.weightQ4_K[4096 4608]
-
blk.14.attn_q.weightQ4_K[4608 4096]
-
blk.14.attn_v.weightQ4_K[4608 2048]
-
blk.15.attn_k.weightQ4_K[4608 2048]
-
blk.15.attn_output.weightQ4_K[4096 4608]
-
blk.15.attn_q.weightQ4_K[4608 4096]
-
blk.15.attn_v.weightQ4_K[4608 2048]
-
blk.15.attn_norm.weightF32[4608]
-
blk.15.ffn_down.weightQ4_K[36864 4608]
-
blk.15.ffn_gate.weightQ4_K[4608 36864]
-
blk.15.ffn_up.weightQ4_K[4608 36864]
-
blk.15.post_attention_norm.weightF32[4608]
-
blk.15.post_ffw_norm.weightF32[4608]
-
blk.15.ffn_norm.weightF32[4608]
-
blk.16.attn_norm.weightF32[4608]
-
blk.16.ffn_down.weightQ6_K[36864 4608]
-
blk.16.ffn_gate.weightQ4_K[4608 36864]
-
blk.16.ffn_up.weightQ4_K[4608 36864]
-
blk.16.post_attention_norm.weightF32[4608]
-
blk.16.post_ffw_norm.weightF32[4608]
-
blk.16.ffn_norm.weightF32[4608]
-
blk.16.attn_k.weightQ4_K[4608 2048]
-
blk.16.attn_output.weightQ4_K[4096 4608]
-
blk.16.attn_q.weightQ4_K[4608 4096]
-
blk.16.attn_v.weightQ6_K[4608 2048]
-
blk.17.attn_norm.weightF32[4608]
-
blk.17.ffn_down.weightQ4_K[36864 4608]
-
blk.17.ffn_gate.weightQ4_K[4608 36864]
-
blk.17.ffn_up.weightQ4_K[4608 36864]
-
blk.17.post_attention_norm.weightF32[4608]
-
blk.17.post_ffw_norm.weightF32[4608]
-
blk.17.ffn_norm.weightF32[4608]
-
blk.17.attn_k.weightQ4_K[4608 2048]
-
blk.17.attn_output.weightQ4_K[4096 4608]
-
blk.17.attn_q.weightQ4_K[4608 4096]
-
blk.17.attn_v.weightQ4_K[4608 2048]
-
blk.18.attn_norm.weightF32[4608]
-
blk.18.ffn_down.weightQ4_K[36864 4608]
-
blk.18.ffn_gate.weightQ4_K[4608 36864]
-
blk.18.ffn_up.weightQ4_K[4608 36864]
-
blk.18.post_attention_norm.weightF32[4608]
-
blk.18.post_ffw_norm.weightF32[4608]
-
blk.18.ffn_norm.weightF32[4608]
-
blk.18.attn_k.weightQ4_K[4608 2048]
-
blk.18.attn_output.weightQ4_K[4096 4608]
-
blk.18.attn_q.weightQ4_K[4608 4096]
-
blk.18.attn_v.weightQ4_K[4608 2048]
-
blk.19.ffn_gate.weightQ4_K[4608 36864]
-
blk.19.attn_k.weightQ4_K[4608 2048]
-
blk.19.attn_output.weightQ4_K[4096 4608]
-
blk.19.attn_q.weightQ4_K[4608 4096]
-
blk.19.attn_v.weightQ6_K[4608 2048]
-
blk.19.attn_norm.weightF32[4608]
-
blk.19.ffn_down.weightQ6_K[36864 4608]
-
blk.19.ffn_up.weightQ4_K[4608 36864]
-
blk.19.post_attention_norm.weightF32[4608]
-
blk.19.post_ffw_norm.weightF32[4608]
-
blk.19.ffn_norm.weightF32[4608]
-
blk.20.attn_norm.weightF32[4608]
-
blk.20.ffn_down.weightQ4_K[36864 4608]
-
blk.20.ffn_gate.weightQ4_K[4608 36864]
-
blk.20.ffn_up.weightQ4_K[4608 36864]
-
blk.20.post_attention_norm.weightF32[4608]
-
blk.20.post_ffw_norm.weightF32[4608]
-
blk.20.ffn_norm.weightF32[4608]
-
blk.20.attn_k.weightQ4_K[4608 2048]
-
blk.20.attn_output.weightQ4_K[4096 4608]
-
blk.20.attn_q.weightQ4_K[4608 4096]
-
blk.20.attn_v.weightQ4_K[4608 2048]
-
blk.21.attn_norm.weightF32[4608]
-
blk.21.ffn_down.weightQ4_K[36864 4608]
-
blk.21.ffn_gate.weightQ4_K[4608 36864]
-
blk.21.ffn_up.weightQ4_K[4608 36864]
-
blk.21.post_attention_norm.weightF32[4608]
-
blk.21.post_ffw_norm.weightF32[4608]
-
blk.21.ffn_norm.weightF32[4608]
-
blk.21.attn_k.weightQ4_K[4608 2048]
-
blk.21.attn_output.weightQ4_K[4096 4608]
-
blk.21.attn_q.weightQ4_K[4608 4096]
-
blk.21.attn_v.weightQ4_K[4608 2048]
-
blk.22.attn_norm.weightF32[4608]
-
blk.22.ffn_down.weightQ6_K[36864 4608]
-
blk.22.ffn_gate.weightQ4_K[4608 36864]
-
blk.22.ffn_up.weightQ4_K[4608 36864]
-
blk.22.post_attention_norm.weightF32[4608]
-
blk.22.post_ffw_norm.weightF32[4608]
-
blk.22.ffn_norm.weightF32[4608]
-
blk.22.attn_k.weightQ4_K[4608 2048]
-
blk.22.attn_output.weightQ4_K[4096 4608]
-
blk.22.attn_q.weightQ4_K[4608 4096]
-
blk.22.attn_v.weightQ6_K[4608 2048]
-
blk.23.ffn_gate.weightQ4_K[4608 36864]
-
blk.23.ffn_up.weightQ4_K[4608 36864]
-
blk.23.attn_k.weightQ4_K[4608 2048]
-
blk.23.attn_output.weightQ4_K[4096 4608]
-
blk.23.attn_q.weightQ4_K[4608 4096]
-
blk.23.attn_v.weightQ4_K[4608 2048]
-
blk.23.attn_norm.weightF32[4608]
-
blk.23.ffn_down.weightQ4_K[36864 4608]
-
blk.23.post_attention_norm.weightF32[4608]
-
blk.23.post_ffw_norm.weightF32[4608]
-
blk.23.ffn_norm.weightF32[4608]
-
blk.24.attn_norm.weightF32[4608]
-
blk.24.ffn_down.weightQ4_K[36864 4608]
-
blk.24.ffn_gate.weightQ4_K[4608 36864]
-
blk.24.ffn_up.weightQ4_K[4608 36864]
-
blk.24.post_attention_norm.weightF32[4608]
-
blk.24.post_ffw_norm.weightF32[4608]
-
blk.24.ffn_norm.weightF32[4608]
-
blk.24.attn_k.weightQ4_K[4608 2048]
-
blk.24.attn_output.weightQ4_K[4096 4608]
-
blk.24.attn_q.weightQ4_K[4608 4096]
-
blk.24.attn_v.weightQ4_K[4608 2048]
-
blk.25.attn_norm.weightF32[4608]
-
blk.25.ffn_down.weightQ6_K[36864 4608]
-
blk.25.ffn_gate.weightQ4_K[4608 36864]
-
blk.25.ffn_up.weightQ4_K[4608 36864]
-
blk.25.post_attention_norm.weightF32[4608]
-
blk.25.post_ffw_norm.weightF32[4608]
-
blk.25.ffn_norm.weightF32[4608]
-
blk.25.attn_k.weightQ4_K[4608 2048]
-
blk.25.attn_output.weightQ4_K[4096 4608]
-
blk.25.attn_q.weightQ4_K[4608 4096]
-
blk.25.attn_v.weightQ6_K[4608 2048]
-
blk.26.attn_norm.weightF32[4608]
-
blk.26.ffn_down.weightQ4_K[36864 4608]
-
blk.26.ffn_gate.weightQ4_K[4608 36864]
-
blk.26.ffn_up.weightQ4_K[4608 36864]
-
blk.26.post_attention_norm.weightF32[4608]
-
blk.26.post_ffw_norm.weightF32[4608]
-
blk.26.ffn_norm.weightF32[4608]
-
blk.26.attn_k.weightQ4_K[4608 2048]
-
blk.26.attn_output.weightQ4_K[4096 4608]
-
blk.26.attn_q.weightQ4_K[4608 4096]
-
blk.26.attn_v.weightQ4_K[4608 2048]
-
blk.27.attn_norm.weightF32[4608]
-
blk.27.ffn_down.weightQ4_K[36864 4608]
-
blk.27.ffn_gate.weightQ4_K[4608 36864]
-
blk.27.ffn_up.weightQ4_K[4608 36864]
-
blk.27.post_attention_norm.weightF32[4608]
-
blk.27.post_ffw_norm.weightF32[4608]
-
blk.27.ffn_norm.weightF32[4608]
-
blk.27.attn_k.weightQ4_K[4608 2048]
-
blk.27.attn_output.weightQ4_K[4096 4608]
-
blk.27.attn_q.weightQ4_K[4608 4096]
-
blk.27.attn_v.weightQ4_K[4608 2048]
-
blk.28.attn_k.weightQ4_K[4608 2048]
-
blk.28.attn_output.weightQ4_K[4096 4608]
-
blk.28.attn_q.weightQ4_K[4608 4096]
-
blk.28.attn_v.weightQ6_K[4608 2048]
-
blk.28.attn_norm.weightF32[4608]
-
blk.28.ffn_down.weightQ6_K[36864 4608]
-
blk.28.ffn_gate.weightQ4_K[4608 36864]
-
blk.28.ffn_up.weightQ4_K[4608 36864]
-
blk.28.post_attention_norm.weightF32[4608]
-
blk.28.post_ffw_norm.weightF32[4608]
-
blk.28.ffn_norm.weightF32[4608]
-
blk.29.attn_norm.weightF32[4608]
-
blk.29.ffn_down.weightQ4_K[36864 4608]
-
blk.29.ffn_gate.weightQ4_K[4608 36864]
-
blk.29.ffn_up.weightQ4_K[4608 36864]
-
blk.29.post_attention_norm.weightF32[4608]
-
blk.29.post_ffw_norm.weightF32[4608]
-
blk.29.ffn_norm.weightF32[4608]
-
blk.29.attn_k.weightQ4_K[4608 2048]
-
blk.29.attn_output.weightQ4_K[4096 4608]
-
blk.29.attn_q.weightQ4_K[4608 4096]
-
blk.29.attn_v.weightQ4_K[4608 2048]
-
blk.30.attn_norm.weightF32[4608]
-
blk.30.ffn_down.weightQ4_K[36864 4608]
-
blk.30.ffn_gate.weightQ4_K[4608 36864]
-
blk.30.ffn_up.weightQ4_K[4608 36864]
-
blk.30.post_attention_norm.weightF32[4608]
-
blk.30.post_ffw_norm.weightF32[4608]
-
blk.30.ffn_norm.weightF32[4608]
-
blk.30.attn_k.weightQ4_K[4608 2048]
-
blk.30.attn_output.weightQ4_K[4096 4608]
-
blk.30.attn_q.weightQ4_K[4608 4096]
-
blk.30.attn_v.weightQ4_K[4608 2048]
-
blk.31.attn_norm.weightF32[4608]
-
blk.31.ffn_down.weightQ6_K[36864 4608]
-
blk.31.ffn_gate.weightQ4_K[4608 36864]
-
blk.31.ffn_up.weightQ4_K[4608 36864]
-
blk.31.post_attention_norm.weightF32[4608]
-
blk.31.post_ffw_norm.weightF32[4608]
-
blk.31.ffn_norm.weightF32[4608]
-
blk.31.attn_k.weightQ4_K[4608 2048]
-
blk.31.attn_output.weightQ4_K[4096 4608]
-
blk.31.attn_q.weightQ4_K[4608 4096]
-
blk.31.attn_v.weightQ6_K[4608 2048]
-
blk.32.ffn_gate.weightQ4_K[4608 36864]
-
blk.32.attn_k.weightQ4_K[4608 2048]
-
blk.32.attn_output.weightQ4_K[4096 4608]
-
blk.32.attn_q.weightQ4_K[4608 4096]
-
blk.32.attn_v.weightQ4_K[4608 2048]
-
blk.32.attn_norm.weightF32[4608]
-
blk.32.ffn_down.weightQ4_K[36864 4608]
-
blk.32.ffn_up.weightQ4_K[4608 36864]
-
blk.32.post_attention_norm.weightF32[4608]
-
blk.32.post_ffw_norm.weightF32[4608]
-
blk.32.ffn_norm.weightF32[4608]
-
blk.33.attn_norm.weightF32[4608]
-
blk.33.ffn_down.weightQ4_K[36864 4608]
-
blk.33.ffn_gate.weightQ4_K[4608 36864]
-
blk.33.ffn_up.weightQ4_K[4608 36864]
-
blk.33.post_attention_norm.weightF32[4608]
-
blk.33.post_ffw_norm.weightF32[4608]
-
blk.33.ffn_norm.weightF32[4608]
-
blk.33.attn_k.weightQ4_K[4608 2048]
-
blk.33.attn_output.weightQ4_K[4096 4608]
-
blk.33.attn_q.weightQ4_K[4608 4096]
-
blk.33.attn_v.weightQ4_K[4608 2048]
-
blk.34.attn_norm.weightF32[4608]
-
blk.34.ffn_down.weightQ6_K[36864 4608]
-
blk.34.ffn_gate.weightQ4_K[4608 36864]
-
blk.34.ffn_up.weightQ4_K[4608 36864]
-
blk.34.post_attention_norm.weightF32[4608]
-
blk.34.post_ffw_norm.weightF32[4608]
-
blk.34.ffn_norm.weightF32[4608]
-
blk.34.attn_k.weightQ4_K[4608 2048]
-
blk.34.attn_output.weightQ4_K[4096 4608]
-
blk.34.attn_q.weightQ4_K[4608 4096]
-
blk.34.attn_v.weightQ6_K[4608 2048]
-
blk.35.attn_norm.weightF32[4608]
-
blk.35.ffn_down.weightQ4_K[36864 4608]
-
blk.35.ffn_gate.weightQ4_K[4608 36864]
-
blk.35.ffn_up.weightQ4_K[4608 36864]
-
blk.35.post_attention_norm.weightF32[4608]
-
blk.35.post_ffw_norm.weightF32[4608]
-
blk.35.ffn_norm.weightF32[4608]
-
blk.35.attn_k.weightQ4_K[4608 2048]
-
blk.35.attn_output.weightQ4_K[4096 4608]
-
blk.35.attn_q.weightQ4_K[4608 4096]
-
blk.35.attn_v.weightQ4_K[4608 2048]
-
blk.36.ffn_gate.weightQ4_K[4608 36864]
-
blk.36.ffn_up.weightQ4_K[4608 36864]
-
blk.36.attn_k.weightQ4_K[4608 2048]
-
blk.36.attn_output.weightQ4_K[4096 4608]
-
blk.36.attn_q.weightQ4_K[4608 4096]
-
blk.36.attn_v.weightQ4_K[4608 2048]
-
blk.36.attn_norm.weightF32[4608]
-
blk.36.ffn_down.weightQ4_K[36864 4608]
-
blk.36.post_attention_norm.weightF32[4608]
-
blk.36.post_ffw_norm.weightF32[4608]
-
blk.36.ffn_norm.weightF32[4608]
-
blk.37.attn_norm.weightF32[4608]
-
blk.37.ffn_down.weightQ6_K[36864 4608]
-
blk.37.ffn_gate.weightQ4_K[4608 36864]
-
blk.37.ffn_up.weightQ4_K[4608 36864]
-
blk.37.post_attention_norm.weightF32[4608]
-
blk.37.post_ffw_norm.weightF32[4608]
-
blk.37.ffn_norm.weightF32[4608]
-
blk.37.attn_k.weightQ4_K[4608 2048]
-
blk.37.attn_output.weightQ4_K[4096 4608]
-
blk.37.attn_q.weightQ4_K[4608 4096]
-
blk.37.attn_v.weightQ6_K[4608 2048]
-
blk.38.attn_norm.weightF32[4608]
-
blk.38.ffn_down.weightQ4_K[36864 4608]
-
blk.38.ffn_gate.weightQ4_K[4608 36864]
-
blk.38.ffn_up.weightQ4_K[4608 36864]
-
blk.38.post_attention_norm.weightF32[4608]
-
blk.38.post_ffw_norm.weightF32[4608]
-
blk.38.ffn_norm.weightF32[4608]
-
blk.38.attn_k.weightQ4_K[4608 2048]
-
blk.38.attn_output.weightQ4_K[4096 4608]
-
blk.38.attn_q.weightQ4_K[4608 4096]
-
blk.38.attn_v.weightQ4_K[4608 2048]
-
blk.39.attn_norm.weightF32[4608]
-
blk.39.ffn_down.weightQ4_K[36864 4608]
-
blk.39.ffn_gate.weightQ4_K[4608 36864]
-
blk.39.ffn_up.weightQ4_K[4608 36864]
-
blk.39.post_attention_norm.weightF32[4608]
-
blk.39.post_ffw_norm.weightF32[4608]
-
blk.39.ffn_norm.weightF32[4608]
-
blk.39.attn_k.weightQ4_K[4608 2048]
-
blk.39.attn_output.weightQ4_K[4096 4608]
-
blk.39.attn_q.weightQ4_K[4608 4096]
-
blk.39.attn_v.weightQ4_K[4608 2048]
-
blk.40.attn_norm.weightF32[4608]
-
blk.40.ffn_down.weightQ6_K[36864 4608]
-
blk.40.ffn_gate.weightQ4_K[4608 36864]
-
blk.40.ffn_up.weightQ4_K[4608 36864]
-
blk.40.post_attention_norm.weightF32[4608]
-
blk.40.post_ffw_norm.weightF32[4608]
-
blk.40.ffn_norm.weightF32[4608]
-
blk.40.attn_k.weightQ4_K[4608 2048]
-
blk.40.attn_output.weightQ4_K[4096 4608]
-
blk.40.attn_q.weightQ4_K[4608 4096]
-
blk.40.attn_v.weightQ6_K[4608 2048]
-
blk.41.attn_k.weightQ4_K[4608 2048]
-
blk.41.attn_output.weightQ4_K[4096 4608]
-
blk.41.attn_q.weightQ4_K[4608 4096]
-
blk.41.attn_v.weightQ6_K[4608 2048]
-
blk.41.attn_norm.weightF32[4608]
-
blk.41.ffn_down.weightQ6_K[36864 4608]
-
blk.41.ffn_gate.weightQ4_K[4608 36864]
-
blk.41.ffn_up.weightQ4_K[4608 36864]
-
blk.41.post_attention_norm.weightF32[4608]
-
blk.41.post_ffw_norm.weightF32[4608]
-
blk.41.ffn_norm.weightF32[4608]
-
blk.42.attn_norm.weightF32[4608]
-
blk.42.ffn_down.weightQ6_K[36864 4608]
-
blk.42.ffn_gate.weightQ4_K[4608 36864]
-
blk.42.ffn_up.weightQ4_K[4608 36864]
-
blk.42.post_attention_norm.weightF32[4608]
-
blk.42.post_ffw_norm.weightF32[4608]
-
blk.42.ffn_norm.weightF32[4608]
-
blk.42.attn_k.weightQ4_K[4608 2048]
-
blk.42.attn_output.weightQ4_K[4096 4608]
-
blk.42.attn_q.weightQ4_K[4608 4096]
-
blk.42.attn_v.weightQ6_K[4608 2048]
-
blk.43.attn_norm.weightF32[4608]
-
blk.43.ffn_down.weightQ6_K[36864 4608]
-
blk.43.ffn_gate.weightQ4_K[4608 36864]
-
blk.43.ffn_up.weightQ4_K[4608 36864]
-
blk.43.post_attention_norm.weightF32[4608]
-
blk.43.post_ffw_norm.weightF32[4608]
-
blk.43.ffn_norm.weightF32[4608]
-
blk.43.attn_k.weightQ4_K[4608 2048]
-
blk.43.attn_output.weightQ4_K[4096 4608]
-
blk.43.attn_q.weightQ4_K[4608 4096]
-
blk.43.attn_v.weightQ6_K[4608 2048]
-
blk.44.attn_norm.weightF32[4608]
-
blk.44.ffn_down.weightQ6_K[36864 4608]
-
blk.44.ffn_gate.weightQ4_K[4608 36864]
-
blk.44.ffn_up.weightQ4_K[4608 36864]
-
blk.44.post_attention_norm.weightF32[4608]
-
blk.44.post_ffw_norm.weightF32[4608]
-
blk.44.ffn_norm.weightF32[4608]
-
blk.44.attn_k.weightQ4_K[4608 2048]
-
blk.44.attn_output.weightQ4_K[4096 4608]
-
blk.44.attn_q.weightQ4_K[4608 4096]
-
blk.44.attn_v.weightQ6_K[4608 2048]
-
blk.45.ffn_gate.weightQ4_K[4608 36864]
-
blk.45.attn_k.weightQ4_K[4608 2048]
-
blk.45.attn_output.weightQ4_K[4096 4608]
-
blk.45.attn_q.weightQ4_K[4608 4096]
-
blk.45.attn_v.weightQ6_K[4608 2048]
-
blk.45.attn_norm.weightF32[4608]
-
blk.45.ffn_down.weightQ6_K[36864 4608]
-
blk.45.ffn_up.weightQ4_K[4608 36864]
-
blk.45.post_attention_norm.weightF32[4608]
-
blk.45.post_ffw_norm.weightF32[4608]
-
blk.45.ffn_norm.weightF32[4608]
-
output_norm.weightF32[4608]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45