27b
29GB
Google gemma-2-27b-it korean finetuned model with SFT->DPO
27B
21 Pulls Updated 5 weeks ago
e573544eae5b · 29GB
-
general.architecturegemma2
-
general.file_typeQ8_0
-
gemma2.attention.head_count32
-
gemma2.attention.head_count_kv16
-
gemma2.attention.key_length128
-
gemma2.attention.layer_norm_rms_epsilon1e-06
-
gemma2.attention.sliding_window4096
-
gemma2.attention.value_length128
-
gemma2.attn_logit_softcapping50
-
gemma2.block_count46
-
gemma2.context_length8192
-
gemma2.embedding_length4608
-
gemma2.feed_forward_length36864
-
gemma2.final_logit_softcapping30
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id2
-
tokenizer.ggml.eos_token_id1
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id1
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<pad> <eos> <bos> <unk> <mask> ...]
-
tokenizer.ggml.unknown_token_id3
-
NameTypeShape
-
token_embd.weightQ8_0[4608 256000]
-
blk.0.attn_norm.weightF32[4608]
-
blk.0.ffn_down.weightQ8_0[36864 4608]
-
blk.0.ffn_gate.weightQ8_0[4608 36864]
-
blk.0.ffn_up.weightQ8_0[4608 36864]
-
blk.0.post_attention_norm.weightF32[4608]
-
blk.0.post_ffw_norm.weightF32[4608]
-
blk.0.ffn_norm.weightF32[4608]
-
blk.0.attn_k.weightQ8_0[4608 2048]
-
blk.0.attn_output.weightQ8_0[4096 4608]
-
blk.0.attn_q.weightQ8_0[4608 4096]
-
blk.0.attn_v.weightQ8_0[4608 2048]
-
blk.1.attn_norm.weightF32[4608]
-
blk.1.ffn_down.weightQ8_0[36864 4608]
-
blk.1.ffn_gate.weightQ8_0[4608 36864]
-
blk.1.ffn_up.weightQ8_0[4608 36864]
-
blk.1.post_attention_norm.weightF32[4608]
-
blk.1.post_ffw_norm.weightF32[4608]
-
blk.1.ffn_norm.weightF32[4608]
-
blk.1.attn_k.weightQ8_0[4608 2048]
-
blk.1.attn_output.weightQ8_0[4096 4608]
-
blk.1.attn_q.weightQ8_0[4608 4096]
-
blk.1.attn_v.weightQ8_0[4608 2048]
-
blk.2.attn_k.weightQ8_0[4608 2048]
-
blk.2.attn_output.weightQ8_0[4096 4608]
-
blk.2.attn_q.weightQ8_0[4608 4096]
-
blk.2.attn_v.weightQ8_0[4608 2048]
-
blk.2.attn_norm.weightF32[4608]
-
blk.2.ffn_down.weightQ8_0[36864 4608]
-
blk.2.ffn_gate.weightQ8_0[4608 36864]
-
blk.2.ffn_up.weightQ8_0[4608 36864]
-
blk.2.post_attention_norm.weightF32[4608]
-
blk.2.post_ffw_norm.weightF32[4608]
-
blk.2.ffn_norm.weightF32[4608]
-
blk.3.attn_norm.weightF32[4608]
-
blk.3.ffn_down.weightQ8_0[36864 4608]
-
blk.3.ffn_gate.weightQ8_0[4608 36864]
-
blk.3.ffn_up.weightQ8_0[4608 36864]
-
blk.3.post_attention_norm.weightF32[4608]
-
blk.3.post_ffw_norm.weightF32[4608]
-
blk.3.ffn_norm.weightF32[4608]
-
blk.3.attn_k.weightQ8_0[4608 2048]
-
blk.3.attn_output.weightQ8_0[4096 4608]
-
blk.3.attn_q.weightQ8_0[4608 4096]
-
blk.3.attn_v.weightQ8_0[4608 2048]
-
blk.4.attn_norm.weightF32[4608]
-
blk.4.ffn_down.weightQ8_0[36864 4608]
-
blk.4.ffn_gate.weightQ8_0[4608 36864]
-
blk.4.ffn_up.weightQ8_0[4608 36864]
-
blk.4.post_attention_norm.weightF32[4608]
-
blk.4.post_ffw_norm.weightF32[4608]
-
blk.4.ffn_norm.weightF32[4608]
-
blk.4.attn_k.weightQ8_0[4608 2048]
-
blk.4.attn_output.weightQ8_0[4096 4608]
-
blk.4.attn_q.weightQ8_0[4608 4096]
-
blk.4.attn_v.weightQ8_0[4608 2048]
-
blk.5.attn_norm.weightF32[4608]
-
blk.5.ffn_down.weightQ8_0[36864 4608]
-
blk.5.ffn_gate.weightQ8_0[4608 36864]
-
blk.5.ffn_up.weightQ8_0[4608 36864]
-
blk.5.post_attention_norm.weightF32[4608]
-
blk.5.post_ffw_norm.weightF32[4608]
-
blk.5.ffn_norm.weightF32[4608]
-
blk.5.attn_k.weightQ8_0[4608 2048]
-
blk.5.attn_output.weightQ8_0[4096 4608]
-
blk.5.attn_q.weightQ8_0[4608 4096]
-
blk.5.attn_v.weightQ8_0[4608 2048]
-
blk.6.ffn_gate.weightQ8_0[4608 36864]
-
blk.6.attn_k.weightQ8_0[4608 2048]
-
blk.6.attn_output.weightQ8_0[4096 4608]
-
blk.6.attn_q.weightQ8_0[4608 4096]
-
blk.6.attn_v.weightQ8_0[4608 2048]
-
blk.6.attn_norm.weightF32[4608]
-
blk.6.ffn_down.weightQ8_0[36864 4608]
-
blk.6.ffn_up.weightQ8_0[4608 36864]
-
blk.6.post_attention_norm.weightF32[4608]
-
blk.6.post_ffw_norm.weightF32[4608]
-
blk.6.ffn_norm.weightF32[4608]
-
blk.7.attn_norm.weightF32[4608]
-
blk.7.ffn_down.weightQ8_0[36864 4608]
-
blk.7.ffn_gate.weightQ8_0[4608 36864]
-
blk.7.ffn_up.weightQ8_0[4608 36864]
-
blk.7.post_attention_norm.weightF32[4608]
-
blk.7.post_ffw_norm.weightF32[4608]
-
blk.7.ffn_norm.weightF32[4608]
-
blk.7.attn_k.weightQ8_0[4608 2048]
-
blk.7.attn_output.weightQ8_0[4096 4608]
-
blk.7.attn_q.weightQ8_0[4608 4096]
-
blk.7.attn_v.weightQ8_0[4608 2048]
-
blk.8.attn_norm.weightF32[4608]
-
blk.8.ffn_down.weightQ8_0[36864 4608]
-
blk.8.ffn_gate.weightQ8_0[4608 36864]
-
blk.8.ffn_up.weightQ8_0[4608 36864]
-
blk.8.post_attention_norm.weightF32[4608]
-
blk.8.post_ffw_norm.weightF32[4608]
-
blk.8.ffn_norm.weightF32[4608]
-
blk.8.attn_k.weightQ8_0[4608 2048]
-
blk.8.attn_output.weightQ8_0[4096 4608]
-
blk.8.attn_q.weightQ8_0[4608 4096]
-
blk.8.attn_v.weightQ8_0[4608 2048]
-
blk.9.attn_norm.weightF32[4608]
-
blk.9.ffn_down.weightQ8_0[36864 4608]
-
blk.9.ffn_gate.weightQ8_0[4608 36864]
-
blk.9.ffn_up.weightQ8_0[4608 36864]
-
blk.9.post_attention_norm.weightF32[4608]
-
blk.9.post_ffw_norm.weightF32[4608]
-
blk.9.ffn_norm.weightF32[4608]
-
blk.9.attn_k.weightQ8_0[4608 2048]
-
blk.9.attn_output.weightQ8_0[4096 4608]
-
blk.9.attn_q.weightQ8_0[4608 4096]
-
blk.9.attn_v.weightQ8_0[4608 2048]
-
blk.10.ffn_gate.weightQ8_0[4608 36864]
-
blk.10.ffn_up.weightQ8_0[4608 36864]
-
blk.10.attn_k.weightQ8_0[4608 2048]
-
blk.10.attn_output.weightQ8_0[4096 4608]
-
blk.10.attn_q.weightQ8_0[4608 4096]
-
blk.10.attn_v.weightQ8_0[4608 2048]
-
blk.10.attn_norm.weightF32[4608]
-
blk.10.ffn_down.weightQ8_0[36864 4608]
-
blk.10.post_attention_norm.weightF32[4608]
-
blk.10.post_ffw_norm.weightF32[4608]
-
blk.10.ffn_norm.weightF32[4608]
-
blk.11.attn_norm.weightF32[4608]
-
blk.11.ffn_down.weightQ8_0[36864 4608]
-
blk.11.ffn_gate.weightQ8_0[4608 36864]
-
blk.11.ffn_up.weightQ8_0[4608 36864]
-
blk.11.post_attention_norm.weightF32[4608]
-
blk.11.post_ffw_norm.weightF32[4608]
-
blk.11.ffn_norm.weightF32[4608]
-
blk.11.attn_k.weightQ8_0[4608 2048]
-
blk.11.attn_output.weightQ8_0[4096 4608]
-
blk.11.attn_q.weightQ8_0[4608 4096]
-
blk.11.attn_v.weightQ8_0[4608 2048]
-
blk.12.attn_norm.weightF32[4608]
-
blk.12.ffn_down.weightQ8_0[36864 4608]
-
blk.12.ffn_gate.weightQ8_0[4608 36864]
-
blk.12.ffn_up.weightQ8_0[4608 36864]
-
blk.12.post_attention_norm.weightF32[4608]
-
blk.12.post_ffw_norm.weightF32[4608]
-
blk.12.ffn_norm.weightF32[4608]
-
blk.12.attn_k.weightQ8_0[4608 2048]
-
blk.12.attn_output.weightQ8_0[4096 4608]
-
blk.12.attn_q.weightQ8_0[4608 4096]
-
blk.12.attn_v.weightQ8_0[4608 2048]
-
blk.13.attn_norm.weightF32[4608]
-
blk.13.ffn_down.weightQ8_0[36864 4608]
-
blk.13.ffn_gate.weightQ8_0[4608 36864]
-
blk.13.ffn_up.weightQ8_0[4608 36864]
-
blk.13.post_attention_norm.weightF32[4608]
-
blk.13.post_ffw_norm.weightF32[4608]
-
blk.13.ffn_norm.weightF32[4608]
-
blk.13.attn_k.weightQ8_0[4608 2048]
-
blk.13.attn_output.weightQ8_0[4096 4608]
-
blk.13.attn_q.weightQ8_0[4608 4096]
-
blk.13.attn_v.weightQ8_0[4608 2048]
-
blk.14.attn_norm.weightF32[4608]
-
blk.14.ffn_down.weightQ8_0[36864 4608]
-
blk.14.ffn_gate.weightQ8_0[4608 36864]
-
blk.14.ffn_up.weightQ8_0[4608 36864]
-
blk.14.post_attention_norm.weightF32[4608]
-
blk.14.post_ffw_norm.weightF32[4608]
-
blk.14.ffn_norm.weightF32[4608]
-
blk.14.attn_k.weightQ8_0[4608 2048]
-
blk.14.attn_output.weightQ8_0[4096 4608]
-
blk.14.attn_q.weightQ8_0[4608 4096]
-
blk.14.attn_v.weightQ8_0[4608 2048]
-
blk.15.attn_k.weightQ8_0[4608 2048]
-
blk.15.attn_output.weightQ8_0[4096 4608]
-
blk.15.attn_q.weightQ8_0[4608 4096]
-
blk.15.attn_v.weightQ8_0[4608 2048]
-
blk.15.attn_norm.weightF32[4608]
-
blk.15.ffn_down.weightQ8_0[36864 4608]
-
blk.15.ffn_gate.weightQ8_0[4608 36864]
-
blk.15.ffn_up.weightQ8_0[4608 36864]
-
blk.15.post_attention_norm.weightF32[4608]
-
blk.15.post_ffw_norm.weightF32[4608]
-
blk.15.ffn_norm.weightF32[4608]
-
blk.16.attn_norm.weightF32[4608]
-
blk.16.ffn_down.weightQ8_0[36864 4608]
-
blk.16.ffn_gate.weightQ8_0[4608 36864]
-
blk.16.ffn_up.weightQ8_0[4608 36864]
-
blk.16.post_attention_norm.weightF32[4608]
-
blk.16.post_ffw_norm.weightF32[4608]
-
blk.16.ffn_norm.weightF32[4608]
-
blk.16.attn_k.weightQ8_0[4608 2048]
-
blk.16.attn_output.weightQ8_0[4096 4608]
-
blk.16.attn_q.weightQ8_0[4608 4096]
-
blk.16.attn_v.weightQ8_0[4608 2048]
-
blk.17.attn_norm.weightF32[4608]
-
blk.17.ffn_down.weightQ8_0[36864 4608]
-
blk.17.ffn_gate.weightQ8_0[4608 36864]
-
blk.17.ffn_up.weightQ8_0[4608 36864]
-
blk.17.post_attention_norm.weightF32[4608]
-
blk.17.post_ffw_norm.weightF32[4608]
-
blk.17.ffn_norm.weightF32[4608]
-
blk.17.attn_k.weightQ8_0[4608 2048]
-
blk.17.attn_output.weightQ8_0[4096 4608]
-
blk.17.attn_q.weightQ8_0[4608 4096]
-
blk.17.attn_v.weightQ8_0[4608 2048]
-
blk.18.attn_norm.weightF32[4608]
-
blk.18.ffn_down.weightQ8_0[36864 4608]
-
blk.18.ffn_gate.weightQ8_0[4608 36864]
-
blk.18.ffn_up.weightQ8_0[4608 36864]
-
blk.18.post_attention_norm.weightF32[4608]
-
blk.18.post_ffw_norm.weightF32[4608]
-
blk.18.ffn_norm.weightF32[4608]
-
blk.18.attn_k.weightQ8_0[4608 2048]
-
blk.18.attn_output.weightQ8_0[4096 4608]
-
blk.18.attn_q.weightQ8_0[4608 4096]
-
blk.18.attn_v.weightQ8_0[4608 2048]
-
blk.19.ffn_gate.weightQ8_0[4608 36864]
-
blk.19.attn_k.weightQ8_0[4608 2048]
-
blk.19.attn_output.weightQ8_0[4096 4608]
-
blk.19.attn_q.weightQ8_0[4608 4096]
-
blk.19.attn_v.weightQ8_0[4608 2048]
-
blk.19.attn_norm.weightF32[4608]
-
blk.19.ffn_down.weightQ8_0[36864 4608]
-
blk.19.ffn_up.weightQ8_0[4608 36864]
-
blk.19.post_attention_norm.weightF32[4608]
-
blk.19.post_ffw_norm.weightF32[4608]
-
blk.19.ffn_norm.weightF32[4608]
-
blk.20.attn_norm.weightF32[4608]
-
blk.20.ffn_down.weightQ8_0[36864 4608]
-
blk.20.ffn_gate.weightQ8_0[4608 36864]
-
blk.20.ffn_up.weightQ8_0[4608 36864]
-
blk.20.post_attention_norm.weightF32[4608]
-
blk.20.post_ffw_norm.weightF32[4608]
-
blk.20.ffn_norm.weightF32[4608]
-
blk.20.attn_k.weightQ8_0[4608 2048]
-
blk.20.attn_output.weightQ8_0[4096 4608]
-
blk.20.attn_q.weightQ8_0[4608 4096]
-
blk.20.attn_v.weightQ8_0[4608 2048]
-
blk.21.attn_norm.weightF32[4608]
-
blk.21.ffn_down.weightQ8_0[36864 4608]
-
blk.21.ffn_gate.weightQ8_0[4608 36864]
-
blk.21.ffn_up.weightQ8_0[4608 36864]
-
blk.21.post_attention_norm.weightF32[4608]
-
blk.21.post_ffw_norm.weightF32[4608]
-
blk.21.ffn_norm.weightF32[4608]
-
blk.21.attn_k.weightQ8_0[4608 2048]
-
blk.21.attn_output.weightQ8_0[4096 4608]
-
blk.21.attn_q.weightQ8_0[4608 4096]
-
blk.21.attn_v.weightQ8_0[4608 2048]
-
blk.22.attn_norm.weightF32[4608]
-
blk.22.ffn_down.weightQ8_0[36864 4608]
-
blk.22.ffn_gate.weightQ8_0[4608 36864]
-
blk.22.ffn_up.weightQ8_0[4608 36864]
-
blk.22.post_attention_norm.weightF32[4608]
-
blk.22.post_ffw_norm.weightF32[4608]
-
blk.22.ffn_norm.weightF32[4608]
-
blk.22.attn_k.weightQ8_0[4608 2048]
-
blk.22.attn_output.weightQ8_0[4096 4608]
-
blk.22.attn_q.weightQ8_0[4608 4096]
-
blk.22.attn_v.weightQ8_0[4608 2048]
-
blk.23.ffn_gate.weightQ8_0[4608 36864]
-
blk.23.ffn_up.weightQ8_0[4608 36864]
-
blk.23.attn_k.weightQ8_0[4608 2048]
-
blk.23.attn_output.weightQ8_0[4096 4608]
-
blk.23.attn_q.weightQ8_0[4608 4096]
-
blk.23.attn_v.weightQ8_0[4608 2048]
-
blk.23.attn_norm.weightF32[4608]
-
blk.23.ffn_down.weightQ8_0[36864 4608]
-
blk.23.post_attention_norm.weightF32[4608]
-
blk.23.post_ffw_norm.weightF32[4608]
-
blk.23.ffn_norm.weightF32[4608]
-
blk.24.attn_norm.weightF32[4608]
-
blk.24.ffn_down.weightQ8_0[36864 4608]
-
blk.24.ffn_gate.weightQ8_0[4608 36864]
-
blk.24.ffn_up.weightQ8_0[4608 36864]
-
blk.24.post_attention_norm.weightF32[4608]
-
blk.24.post_ffw_norm.weightF32[4608]
-
blk.24.ffn_norm.weightF32[4608]
-
blk.24.attn_k.weightQ8_0[4608 2048]
-
blk.24.attn_output.weightQ8_0[4096 4608]
-
blk.24.attn_q.weightQ8_0[4608 4096]
-
blk.24.attn_v.weightQ8_0[4608 2048]
-
blk.25.attn_norm.weightF32[4608]
-
blk.25.ffn_down.weightQ8_0[36864 4608]
-
blk.25.ffn_gate.weightQ8_0[4608 36864]
-
blk.25.ffn_up.weightQ8_0[4608 36864]
-
blk.25.post_attention_norm.weightF32[4608]
-
blk.25.post_ffw_norm.weightF32[4608]
-
blk.25.ffn_norm.weightF32[4608]
-
blk.25.attn_k.weightQ8_0[4608 2048]
-
blk.25.attn_output.weightQ8_0[4096 4608]
-
blk.25.attn_q.weightQ8_0[4608 4096]
-
blk.25.attn_v.weightQ8_0[4608 2048]
-
blk.26.attn_norm.weightF32[4608]
-
blk.26.ffn_down.weightQ8_0[36864 4608]
-
blk.26.ffn_gate.weightQ8_0[4608 36864]
-
blk.26.ffn_up.weightQ8_0[4608 36864]
-
blk.26.post_attention_norm.weightF32[4608]
-
blk.26.post_ffw_norm.weightF32[4608]
-
blk.26.ffn_norm.weightF32[4608]
-
blk.26.attn_k.weightQ8_0[4608 2048]
-
blk.26.attn_output.weightQ8_0[4096 4608]
-
blk.26.attn_q.weightQ8_0[4608 4096]
-
blk.26.attn_v.weightQ8_0[4608 2048]
-
blk.27.attn_norm.weightF32[4608]
-
blk.27.ffn_down.weightQ8_0[36864 4608]
-
blk.27.ffn_gate.weightQ8_0[4608 36864]
-
blk.27.ffn_up.weightQ8_0[4608 36864]
-
blk.27.post_attention_norm.weightF32[4608]
-
blk.27.post_ffw_norm.weightF32[4608]
-
blk.27.ffn_norm.weightF32[4608]
-
blk.27.attn_k.weightQ8_0[4608 2048]
-
blk.27.attn_output.weightQ8_0[4096 4608]
-
blk.27.attn_q.weightQ8_0[4608 4096]
-
blk.27.attn_v.weightQ8_0[4608 2048]
-
blk.28.attn_k.weightQ8_0[4608 2048]
-
blk.28.attn_output.weightQ8_0[4096 4608]
-
blk.28.attn_q.weightQ8_0[4608 4096]
-
blk.28.attn_v.weightQ8_0[4608 2048]
-
blk.28.attn_norm.weightF32[4608]
-
blk.28.ffn_down.weightQ8_0[36864 4608]
-
blk.28.ffn_gate.weightQ8_0[4608 36864]
-
blk.28.ffn_up.weightQ8_0[4608 36864]
-
blk.28.post_attention_norm.weightF32[4608]
-
blk.28.post_ffw_norm.weightF32[4608]
-
blk.28.ffn_norm.weightF32[4608]
-
blk.29.attn_norm.weightF32[4608]
-
blk.29.ffn_down.weightQ8_0[36864 4608]
-
blk.29.ffn_gate.weightQ8_0[4608 36864]
-
blk.29.ffn_up.weightQ8_0[4608 36864]
-
blk.29.post_attention_norm.weightF32[4608]
-
blk.29.post_ffw_norm.weightF32[4608]
-
blk.29.ffn_norm.weightF32[4608]
-
blk.29.attn_k.weightQ8_0[4608 2048]
-
blk.29.attn_output.weightQ8_0[4096 4608]
-
blk.29.attn_q.weightQ8_0[4608 4096]
-
blk.29.attn_v.weightQ8_0[4608 2048]
-
blk.30.attn_norm.weightF32[4608]
-
blk.30.ffn_down.weightQ8_0[36864 4608]
-
blk.30.ffn_gate.weightQ8_0[4608 36864]
-
blk.30.ffn_up.weightQ8_0[4608 36864]
-
blk.30.post_attention_norm.weightF32[4608]
-
blk.30.post_ffw_norm.weightF32[4608]
-
blk.30.ffn_norm.weightF32[4608]
-
blk.30.attn_k.weightQ8_0[4608 2048]
-
blk.30.attn_output.weightQ8_0[4096 4608]
-
blk.30.attn_q.weightQ8_0[4608 4096]
-
blk.30.attn_v.weightQ8_0[4608 2048]
-
blk.31.attn_norm.weightF32[4608]
-
blk.31.ffn_down.weightQ8_0[36864 4608]
-
blk.31.ffn_gate.weightQ8_0[4608 36864]
-
blk.31.ffn_up.weightQ8_0[4608 36864]
-
blk.31.post_attention_norm.weightF32[4608]
-
blk.31.post_ffw_norm.weightF32[4608]
-
blk.31.ffn_norm.weightF32[4608]
-
blk.31.attn_k.weightQ8_0[4608 2048]
-
blk.31.attn_output.weightQ8_0[4096 4608]
-
blk.31.attn_q.weightQ8_0[4608 4096]
-
blk.31.attn_v.weightQ8_0[4608 2048]
-
blk.32.ffn_gate.weightQ8_0[4608 36864]
-
blk.32.attn_k.weightQ8_0[4608 2048]
-
blk.32.attn_output.weightQ8_0[4096 4608]
-
blk.32.attn_q.weightQ8_0[4608 4096]
-
blk.32.attn_v.weightQ8_0[4608 2048]
-
blk.32.attn_norm.weightF32[4608]
-
blk.32.ffn_down.weightQ8_0[36864 4608]
-
blk.32.ffn_up.weightQ8_0[4608 36864]
-
blk.32.post_attention_norm.weightF32[4608]
-
blk.32.post_ffw_norm.weightF32[4608]
-
blk.32.ffn_norm.weightF32[4608]
-
blk.33.attn_norm.weightF32[4608]
-
blk.33.ffn_down.weightQ8_0[36864 4608]
-
blk.33.ffn_gate.weightQ8_0[4608 36864]
-
blk.33.ffn_up.weightQ8_0[4608 36864]
-
blk.33.post_attention_norm.weightF32[4608]
-
blk.33.post_ffw_norm.weightF32[4608]
-
blk.33.ffn_norm.weightF32[4608]
-
blk.33.attn_k.weightQ8_0[4608 2048]
-
blk.33.attn_output.weightQ8_0[4096 4608]
-
blk.33.attn_q.weightQ8_0[4608 4096]
-
blk.33.attn_v.weightQ8_0[4608 2048]
-
blk.34.attn_norm.weightF32[4608]
-
blk.34.ffn_down.weightQ8_0[36864 4608]
-
blk.34.ffn_gate.weightQ8_0[4608 36864]
-
blk.34.ffn_up.weightQ8_0[4608 36864]
-
blk.34.post_attention_norm.weightF32[4608]
-
blk.34.post_ffw_norm.weightF32[4608]
-
blk.34.ffn_norm.weightF32[4608]
-
blk.34.attn_k.weightQ8_0[4608 2048]
-
blk.34.attn_output.weightQ8_0[4096 4608]
-
blk.34.attn_q.weightQ8_0[4608 4096]
-
blk.34.attn_v.weightQ8_0[4608 2048]
-
blk.35.attn_norm.weightF32[4608]
-
blk.35.ffn_down.weightQ8_0[36864 4608]
-
blk.35.ffn_gate.weightQ8_0[4608 36864]
-
blk.35.ffn_up.weightQ8_0[4608 36864]
-
blk.35.post_attention_norm.weightF32[4608]
-
blk.35.post_ffw_norm.weightF32[4608]
-
blk.35.ffn_norm.weightF32[4608]
-
blk.35.attn_k.weightQ8_0[4608 2048]
-
blk.35.attn_output.weightQ8_0[4096 4608]
-
blk.35.attn_q.weightQ8_0[4608 4096]
-
blk.35.attn_v.weightQ8_0[4608 2048]
-
blk.36.ffn_gate.weightQ8_0[4608 36864]
-
blk.36.ffn_up.weightQ8_0[4608 36864]
-
blk.36.attn_k.weightQ8_0[4608 2048]
-
blk.36.attn_output.weightQ8_0[4096 4608]
-
blk.36.attn_q.weightQ8_0[4608 4096]
-
blk.36.attn_v.weightQ8_0[4608 2048]
-
blk.36.attn_norm.weightF32[4608]
-
blk.36.ffn_down.weightQ8_0[36864 4608]
-
blk.36.post_attention_norm.weightF32[4608]
-
blk.36.post_ffw_norm.weightF32[4608]
-
blk.36.ffn_norm.weightF32[4608]
-
blk.37.attn_norm.weightF32[4608]
-
blk.37.ffn_down.weightQ8_0[36864 4608]
-
blk.37.ffn_gate.weightQ8_0[4608 36864]
-
blk.37.ffn_up.weightQ8_0[4608 36864]
-
blk.37.post_attention_norm.weightF32[4608]
-
blk.37.post_ffw_norm.weightF32[4608]
-
blk.37.ffn_norm.weightF32[4608]
-
blk.37.attn_k.weightQ8_0[4608 2048]
-
blk.37.attn_output.weightQ8_0[4096 4608]
-
blk.37.attn_q.weightQ8_0[4608 4096]
-
blk.37.attn_v.weightQ8_0[4608 2048]
-
blk.38.attn_norm.weightF32[4608]
-
blk.38.ffn_down.weightQ8_0[36864 4608]
-
blk.38.ffn_gate.weightQ8_0[4608 36864]
-
blk.38.ffn_up.weightQ8_0[4608 36864]
-
blk.38.post_attention_norm.weightF32[4608]
-
blk.38.post_ffw_norm.weightF32[4608]
-
blk.38.ffn_norm.weightF32[4608]
-
blk.38.attn_k.weightQ8_0[4608 2048]
-
blk.38.attn_output.weightQ8_0[4096 4608]
-
blk.38.attn_q.weightQ8_0[4608 4096]
-
blk.38.attn_v.weightQ8_0[4608 2048]
-
blk.39.attn_norm.weightF32[4608]
-
blk.39.ffn_down.weightQ8_0[36864 4608]
-
blk.39.ffn_gate.weightQ8_0[4608 36864]
-
blk.39.ffn_up.weightQ8_0[4608 36864]
-
blk.39.post_attention_norm.weightF32[4608]
-
blk.39.post_ffw_norm.weightF32[4608]
-
blk.39.ffn_norm.weightF32[4608]
-
blk.39.attn_k.weightQ8_0[4608 2048]
-
blk.39.attn_output.weightQ8_0[4096 4608]
-
blk.39.attn_q.weightQ8_0[4608 4096]
-
blk.39.attn_v.weightQ8_0[4608 2048]
-
blk.40.attn_norm.weightF32[4608]
-
blk.40.ffn_down.weightQ8_0[36864 4608]
-
blk.40.ffn_gate.weightQ8_0[4608 36864]
-
blk.40.ffn_up.weightQ8_0[4608 36864]
-
blk.40.post_attention_norm.weightF32[4608]
-
blk.40.post_ffw_norm.weightF32[4608]
-
blk.40.ffn_norm.weightF32[4608]
-
blk.40.attn_k.weightQ8_0[4608 2048]
-
blk.40.attn_output.weightQ8_0[4096 4608]
-
blk.40.attn_q.weightQ8_0[4608 4096]
-
blk.40.attn_v.weightQ8_0[4608 2048]
-
blk.41.attn_k.weightQ8_0[4608 2048]
-
blk.41.attn_output.weightQ8_0[4096 4608]
-
blk.41.attn_q.weightQ8_0[4608 4096]
-
blk.41.attn_v.weightQ8_0[4608 2048]
-
blk.41.attn_norm.weightF32[4608]
-
blk.41.ffn_down.weightQ8_0[36864 4608]
-
blk.41.ffn_gate.weightQ8_0[4608 36864]
-
blk.41.ffn_up.weightQ8_0[4608 36864]
-
blk.41.post_attention_norm.weightF32[4608]
-
blk.41.post_ffw_norm.weightF32[4608]
-
blk.41.ffn_norm.weightF32[4608]
-
blk.42.attn_norm.weightF32[4608]
-
blk.42.ffn_down.weightQ8_0[36864 4608]
-
blk.42.ffn_gate.weightQ8_0[4608 36864]
-
blk.42.ffn_up.weightQ8_0[4608 36864]
-
blk.42.post_attention_norm.weightF32[4608]
-
blk.42.post_ffw_norm.weightF32[4608]
-
blk.42.ffn_norm.weightF32[4608]
-
blk.42.attn_k.weightQ8_0[4608 2048]
-
blk.42.attn_output.weightQ8_0[4096 4608]
-
blk.42.attn_q.weightQ8_0[4608 4096]
-
blk.42.attn_v.weightQ8_0[4608 2048]
-
blk.43.attn_norm.weightF32[4608]
-
blk.43.ffn_down.weightQ8_0[36864 4608]
-
blk.43.ffn_gate.weightQ8_0[4608 36864]
-
blk.43.ffn_up.weightQ8_0[4608 36864]
-
blk.43.post_attention_norm.weightF32[4608]
-
blk.43.post_ffw_norm.weightF32[4608]
-
blk.43.ffn_norm.weightF32[4608]
-
blk.43.attn_k.weightQ8_0[4608 2048]
-
blk.43.attn_output.weightQ8_0[4096 4608]
-
blk.43.attn_q.weightQ8_0[4608 4096]
-
blk.43.attn_v.weightQ8_0[4608 2048]
-
blk.44.attn_norm.weightF32[4608]
-
blk.44.ffn_down.weightQ8_0[36864 4608]
-
blk.44.ffn_gate.weightQ8_0[4608 36864]
-
blk.44.ffn_up.weightQ8_0[4608 36864]
-
blk.44.post_attention_norm.weightF32[4608]
-
blk.44.post_ffw_norm.weightF32[4608]
-
blk.44.ffn_norm.weightF32[4608]
-
blk.44.attn_k.weightQ8_0[4608 2048]
-
blk.44.attn_output.weightQ8_0[4096 4608]
-
blk.44.attn_q.weightQ8_0[4608 4096]
-
blk.44.attn_v.weightQ8_0[4608 2048]
-
blk.45.ffn_gate.weightQ8_0[4608 36864]
-
blk.45.attn_k.weightQ8_0[4608 2048]
-
blk.45.attn_output.weightQ8_0[4096 4608]
-
blk.45.attn_q.weightQ8_0[4608 4096]
-
blk.45.attn_v.weightQ8_0[4608 2048]
-
blk.45.attn_norm.weightF32[4608]
-
blk.45.ffn_down.weightQ8_0[36864 4608]
-
blk.45.ffn_up.weightQ8_0[4608 36864]
-
blk.45.post_attention_norm.weightF32[4608]
-
blk.45.post_ffw_norm.weightF32[4608]
-
blk.45.ffn_norm.weightF32[4608]
-
output_norm.weightF32[4608]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45