An RP model with impressive flexibility.
27B
58 Pulls Updated 7 weeks ago
3588e005ef5b · 17GB
-
general.architecturegemma2
-
general.base_model.0.nameGemmasutra Pro 27B V1E
-
general.base_model.0.organizationBeaverAI
-
general.base_model.0.repo_urlhttps://huggingface.co/BeaverAI/Gemmasutra-Pro-27B-v1e
-
general.base_model.1.nameGemmasutra Pro 27B V1F
-
general.base_model.1.organizationBeaverAI
-
general.base_model.1.repo_urlhttps://huggingface.co/BeaverAI/Gemmasutra-Pro-27B-v1f
-
general.base_model.count2
-
general.file_typeQ4_K_M
-
general.organizationBeaverAI
-
general.quantization_version2
-
gemma2.attention.head_count32
-
gemma2.attention.head_count_kv16
-
gemma2.attention.key_length128
-
gemma2.attention.layer_norm_rms_epsilon1e-06
-
gemma2.attention.sliding_window4096
-
gemma2.attention.value_length128
-
gemma2.attn_logit_softcapping50
-
gemma2.block_count46
-
gemma2.context_length8192
-
gemma2.embedding_length4608
-
gemma2.feed_forward_length36864
-
gemma2.final_logit_softcapping30
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id2
-
tokenizer.ggml.eos_token_id1
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<pad> <eos> <bos> <unk> <mask> ...]
-
tokenizer.ggml.unknown_token_id3
-
NameTypeShape
-
token_embd.weightQ6_K[4608 256000]
-
blk.0.attn_norm.weightF32[4608]
-
blk.0.ffn_down.weightQ6_K[36864 4608]
-
blk.0.ffn_gate.weightQ4_K[4608 36864]
-
blk.0.ffn_up.weightQ4_K[4608 36864]
-
blk.0.post_attention_norm.weightF32[4608]
-
blk.0.post_ffw_norm.weightF32[4608]
-
blk.0.ffn_norm.weightF32[4608]
-
blk.0.attn_k.weightQ4_K[4608 2048]
-
blk.0.attn_output.weightQ4_K[4096 4608]
-
blk.0.attn_q.weightQ4_K[4608 4096]
-
blk.0.attn_v.weightQ6_K[4608 2048]
-
blk.1.attn_norm.weightF32[4608]
-
blk.1.ffn_down.weightQ6_K[36864 4608]
-
blk.1.ffn_gate.weightQ4_K[4608 36864]
-
blk.1.ffn_up.weightQ4_K[4608 36864]
-
blk.1.post_attention_norm.weightF32[4608]
-
blk.1.post_ffw_norm.weightF32[4608]
-
blk.1.ffn_norm.weightF32[4608]
-
blk.1.attn_k.weightQ4_K[4608 2048]
-
blk.1.attn_output.weightQ4_K[4096 4608]
-
blk.1.attn_q.weightQ4_K[4608 4096]
-
blk.1.attn_v.weightQ6_K[4608 2048]
-
blk.2.attn_norm.weightF32[4608]
-
blk.2.ffn_down.weightQ4_K[36864 4608]
-
blk.2.ffn_gate.weightQ4_K[4608 36864]
-
blk.2.ffn_up.weightQ4_K[4608 36864]
-
blk.2.post_attention_norm.weightF32[4608]
-
blk.2.post_ffw_norm.weightF32[4608]
-
blk.2.ffn_norm.weightF32[4608]
-
blk.2.attn_k.weightQ4_K[4608 2048]
-
blk.2.attn_output.weightQ4_K[4096 4608]
-
blk.2.attn_q.weightQ4_K[4608 4096]
-
blk.2.attn_v.weightQ4_K[4608 2048]
-
blk.3.attn_norm.weightF32[4608]
-
blk.3.ffn_down.weightQ4_K[36864 4608]
-
blk.3.ffn_gate.weightQ4_K[4608 36864]
-
blk.3.ffn_up.weightQ4_K[4608 36864]
-
blk.3.post_attention_norm.weightF32[4608]
-
blk.3.post_ffw_norm.weightF32[4608]
-
blk.3.ffn_norm.weightF32[4608]
-
blk.3.attn_k.weightQ4_K[4608 2048]
-
blk.3.attn_output.weightQ4_K[4096 4608]
-
blk.3.attn_q.weightQ4_K[4608 4096]
-
blk.3.attn_v.weightQ4_K[4608 2048]
-
blk.4.attn_norm.weightF32[4608]
-
blk.4.ffn_down.weightQ6_K[36864 4608]
-
blk.4.ffn_gate.weightQ4_K[4608 36864]
-
blk.4.ffn_up.weightQ4_K[4608 36864]
-
blk.4.post_attention_norm.weightF32[4608]
-
blk.4.post_ffw_norm.weightF32[4608]
-
blk.4.ffn_norm.weightF32[4608]
-
blk.4.attn_k.weightQ4_K[4608 2048]
-
blk.4.attn_output.weightQ4_K[4096 4608]
-
blk.4.attn_q.weightQ4_K[4608 4096]
-
blk.4.attn_v.weightQ6_K[4608 2048]
-
blk.5.attn_norm.weightF32[4608]
-
blk.5.ffn_down.weightQ6_K[36864 4608]
-
blk.5.ffn_gate.weightQ4_K[4608 36864]
-
blk.5.ffn_up.weightQ4_K[4608 36864]
-
blk.5.post_attention_norm.weightF32[4608]
-
blk.5.post_ffw_norm.weightF32[4608]
-
blk.5.ffn_norm.weightF32[4608]
-
blk.5.attn_k.weightQ4_K[4608 2048]
-
blk.5.attn_output.weightQ4_K[4096 4608]
-
blk.5.attn_q.weightQ4_K[4608 4096]
-
blk.5.attn_v.weightQ6_K[4608 2048]
-
blk.6.attn_norm.weightF32[4608]
-
blk.6.ffn_down.weightQ6_K[36864 4608]
-
blk.6.ffn_gate.weightQ4_K[4608 36864]
-
blk.6.ffn_up.weightQ4_K[4608 36864]
-
blk.6.post_attention_norm.weightF32[4608]
-
blk.6.post_ffw_norm.weightF32[4608]
-
blk.6.ffn_norm.weightF32[4608]
-
blk.6.attn_k.weightQ4_K[4608 2048]
-
blk.6.attn_output.weightQ4_K[4096 4608]
-
blk.6.attn_q.weightQ4_K[4608 4096]
-
blk.6.attn_v.weightQ6_K[4608 2048]
-
blk.7.attn_norm.weightF32[4608]
-
blk.7.ffn_down.weightQ6_K[36864 4608]
-
blk.7.ffn_gate.weightQ4_K[4608 36864]
-
blk.7.ffn_up.weightQ4_K[4608 36864]
-
blk.7.post_attention_norm.weightF32[4608]
-
blk.7.post_ffw_norm.weightF32[4608]
-
blk.7.ffn_norm.weightF32[4608]
-
blk.7.attn_k.weightQ4_K[4608 2048]
-
blk.7.attn_output.weightQ4_K[4096 4608]
-
blk.7.attn_q.weightQ4_K[4608 4096]
-
blk.7.attn_v.weightQ6_K[4608 2048]
-
blk.8.attn_norm.weightF32[4608]
-
blk.8.ffn_down.weightQ6_K[36864 4608]
-
blk.8.ffn_gate.weightQ4_K[4608 36864]
-
blk.8.ffn_up.weightQ4_K[4608 36864]
-
blk.8.post_attention_norm.weightF32[4608]
-
blk.8.post_ffw_norm.weightF32[4608]
-
blk.8.ffn_norm.weightF32[4608]
-
blk.8.attn_k.weightQ4_K[4608 2048]
-
blk.8.attn_output.weightQ4_K[4096 4608]
-
blk.8.attn_q.weightQ4_K[4608 4096]
-
blk.8.attn_v.weightQ6_K[4608 2048]
-
blk.9.attn_norm.weightF32[4608]
-
blk.9.ffn_down.weightQ6_K[36864 4608]
-
blk.9.ffn_gate.weightQ4_K[4608 36864]
-
blk.9.ffn_up.weightQ4_K[4608 36864]
-
blk.9.post_attention_norm.weightF32[4608]
-
blk.9.post_ffw_norm.weightF32[4608]
-
blk.9.ffn_norm.weightF32[4608]
-
blk.9.attn_k.weightQ4_K[4608 2048]
-
blk.9.attn_output.weightQ4_K[4096 4608]
-
blk.9.attn_q.weightQ4_K[4608 4096]
-
blk.9.attn_v.weightQ6_K[4608 2048]
-
blk.10.attn_norm.weightF32[4608]
-
blk.10.ffn_down.weightQ6_K[36864 4608]
-
blk.10.ffn_gate.weightQ4_K[4608 36864]
-
blk.10.ffn_up.weightQ4_K[4608 36864]
-
blk.10.post_attention_norm.weightF32[4608]
-
blk.10.post_ffw_norm.weightF32[4608]
-
blk.10.ffn_norm.weightF32[4608]
-
blk.10.attn_k.weightQ4_K[4608 2048]
-
blk.10.attn_output.weightQ4_K[4096 4608]
-
blk.10.attn_q.weightQ4_K[4608 4096]
-
blk.10.attn_v.weightQ6_K[4608 2048]
-
blk.11.attn_norm.weightF32[4608]
-
blk.11.ffn_down.weightQ6_K[36864 4608]
-
blk.11.ffn_gate.weightQ4_K[4608 36864]
-
blk.11.ffn_up.weightQ4_K[4608 36864]
-
blk.11.post_attention_norm.weightF32[4608]
-
blk.11.post_ffw_norm.weightF32[4608]
-
blk.11.ffn_norm.weightF32[4608]
-
blk.11.attn_k.weightQ4_K[4608 2048]
-
blk.11.attn_output.weightQ4_K[4096 4608]
-
blk.11.attn_q.weightQ4_K[4608 4096]
-
blk.11.attn_v.weightQ6_K[4608 2048]
-
blk.12.attn_norm.weightF32[4608]
-
blk.12.ffn_down.weightQ6_K[36864 4608]
-
blk.12.ffn_gate.weightQ4_K[4608 36864]
-
blk.12.ffn_up.weightQ4_K[4608 36864]
-
blk.12.post_attention_norm.weightF32[4608]
-
blk.12.post_ffw_norm.weightF32[4608]
-
blk.12.ffn_norm.weightF32[4608]
-
blk.12.attn_k.weightQ4_K[4608 2048]
-
blk.12.attn_output.weightQ4_K[4096 4608]
-
blk.12.attn_q.weightQ4_K[4608 4096]
-
blk.12.attn_v.weightQ6_K[4608 2048]
-
blk.13.attn_norm.weightF32[4608]
-
blk.13.ffn_down.weightQ4_K[36864 4608]
-
blk.13.ffn_gate.weightQ4_K[4608 36864]
-
blk.13.ffn_up.weightQ4_K[4608 36864]
-
blk.13.post_attention_norm.weightF32[4608]
-
blk.13.post_ffw_norm.weightF32[4608]
-
blk.13.ffn_norm.weightF32[4608]
-
blk.13.attn_k.weightQ4_K[4608 2048]
-
blk.13.attn_output.weightQ4_K[4096 4608]
-
blk.13.attn_q.weightQ4_K[4608 4096]
-
blk.13.attn_v.weightQ4_K[4608 2048]
-
blk.14.attn_norm.weightF32[4608]
-
blk.14.ffn_down.weightQ4_K[36864 4608]
-
blk.14.ffn_gate.weightQ4_K[4608 36864]
-
blk.14.ffn_up.weightQ4_K[4608 36864]
-
blk.14.post_attention_norm.weightF32[4608]
-
blk.14.post_ffw_norm.weightF32[4608]
-
blk.14.ffn_norm.weightF32[4608]
-
blk.14.attn_k.weightQ4_K[4608 2048]
-
blk.14.attn_output.weightQ4_K[4096 4608]
-
blk.14.attn_q.weightQ4_K[4608 4096]
-
blk.14.attn_v.weightQ4_K[4608 2048]
-
blk.15.attn_norm.weightF32[4608]
-
blk.15.ffn_down.weightQ6_K[36864 4608]
-
blk.15.ffn_gate.weightQ4_K[4608 36864]
-
blk.15.ffn_up.weightQ4_K[4608 36864]
-
blk.15.post_attention_norm.weightF32[4608]
-
blk.15.post_ffw_norm.weightF32[4608]
-
blk.15.ffn_norm.weightF32[4608]
-
blk.15.attn_k.weightQ4_K[4608 2048]
-
blk.15.attn_output.weightQ4_K[4096 4608]
-
blk.15.attn_q.weightQ4_K[4608 4096]
-
blk.15.attn_v.weightQ6_K[4608 2048]
-
blk.16.attn_norm.weightF32[4608]
-
blk.16.ffn_down.weightQ4_K[36864 4608]
-
blk.16.ffn_gate.weightQ4_K[4608 36864]
-
blk.16.ffn_up.weightQ4_K[4608 36864]
-
blk.16.post_attention_norm.weightF32[4608]
-
blk.16.post_ffw_norm.weightF32[4608]
-
blk.16.ffn_norm.weightF32[4608]
-
blk.16.attn_k.weightQ4_K[4608 2048]
-
blk.16.attn_output.weightQ4_K[4096 4608]
-
blk.16.attn_q.weightQ4_K[4608 4096]
-
blk.16.attn_v.weightQ4_K[4608 2048]
-
blk.17.attn_norm.weightF32[4608]
-
blk.17.ffn_down.weightQ4_K[36864 4608]
-
blk.17.ffn_gate.weightQ4_K[4608 36864]
-
blk.17.ffn_up.weightQ4_K[4608 36864]
-
blk.17.post_attention_norm.weightF32[4608]
-
blk.17.post_ffw_norm.weightF32[4608]
-
blk.17.ffn_norm.weightF32[4608]
-
blk.17.attn_k.weightQ4_K[4608 2048]
-
blk.17.attn_output.weightQ4_K[4096 4608]
-
blk.17.attn_q.weightQ4_K[4608 4096]
-
blk.17.attn_v.weightQ4_K[4608 2048]
-
blk.18.attn_norm.weightF32[4608]
-
blk.18.ffn_down.weightQ6_K[36864 4608]
-
blk.18.ffn_gate.weightQ4_K[4608 36864]
-
blk.18.ffn_up.weightQ4_K[4608 36864]
-
blk.18.post_attention_norm.weightF32[4608]
-
blk.18.post_ffw_norm.weightF32[4608]
-
blk.18.ffn_norm.weightF32[4608]
-
blk.18.attn_k.weightQ4_K[4608 2048]
-
blk.18.attn_output.weightQ4_K[4096 4608]
-
blk.18.attn_q.weightQ4_K[4608 4096]
-
blk.18.attn_v.weightQ6_K[4608 2048]
-
blk.19.attn_norm.weightF32[4608]
-
blk.19.ffn_down.weightQ4_K[36864 4608]
-
blk.19.ffn_gate.weightQ4_K[4608 36864]
-
blk.19.ffn_up.weightQ4_K[4608 36864]
-
blk.19.post_attention_norm.weightF32[4608]
-
blk.19.post_ffw_norm.weightF32[4608]
-
blk.19.ffn_norm.weightF32[4608]
-
blk.19.attn_k.weightQ4_K[4608 2048]
-
blk.19.attn_output.weightQ4_K[4096 4608]
-
blk.19.attn_q.weightQ4_K[4608 4096]
-
blk.19.attn_v.weightQ4_K[4608 2048]
-
blk.20.attn_norm.weightF32[4608]
-
blk.20.ffn_down.weightQ6_K[36864 4608]
-
blk.20.ffn_gate.weightQ4_K[4608 36864]
-
blk.20.ffn_up.weightQ4_K[4608 36864]
-
blk.20.post_attention_norm.weightF32[4608]
-
blk.20.post_ffw_norm.weightF32[4608]
-
blk.20.ffn_norm.weightF32[4608]
-
blk.20.attn_k.weightQ4_K[4608 2048]
-
blk.20.attn_output.weightQ4_K[4096 4608]
-
blk.20.attn_q.weightQ4_K[4608 4096]
-
blk.20.attn_v.weightQ6_K[4608 2048]
-
blk.21.attn_norm.weightF32[4608]
-
blk.21.ffn_down.weightQ4_K[36864 4608]
-
blk.21.ffn_gate.weightQ4_K[4608 36864]
-
blk.21.ffn_up.weightQ4_K[4608 36864]
-
blk.21.post_attention_norm.weightF32[4608]
-
blk.21.post_ffw_norm.weightF32[4608]
-
blk.21.ffn_norm.weightF32[4608]
-
blk.21.attn_k.weightQ4_K[4608 2048]
-
blk.21.attn_output.weightQ4_K[4096 4608]
-
blk.21.attn_q.weightQ4_K[4608 4096]
-
blk.21.attn_v.weightQ4_K[4608 2048]
-
blk.22.attn_norm.weightF32[4608]
-
blk.22.ffn_down.weightQ4_K[36864 4608]
-
blk.22.ffn_gate.weightQ4_K[4608 36864]
-
blk.22.ffn_up.weightQ4_K[4608 36864]
-
blk.22.post_attention_norm.weightF32[4608]
-
blk.22.post_ffw_norm.weightF32[4608]
-
blk.22.ffn_norm.weightF32[4608]
-
blk.22.attn_k.weightQ4_K[4608 2048]
-
blk.22.attn_output.weightQ4_K[4096 4608]
-
blk.22.attn_q.weightQ4_K[4608 4096]
-
blk.22.attn_v.weightQ4_K[4608 2048]
-
blk.23.attn_norm.weightF32[4608]
-
blk.23.ffn_down.weightQ6_K[36864 4608]
-
blk.23.ffn_gate.weightQ4_K[4608 36864]
-
blk.23.ffn_up.weightQ4_K[4608 36864]
-
blk.23.post_attention_norm.weightF32[4608]
-
blk.23.post_ffw_norm.weightF32[4608]
-
blk.23.ffn_norm.weightF32[4608]
-
blk.23.attn_k.weightQ4_K[4608 2048]
-
blk.23.attn_output.weightQ4_K[4096 4608]
-
blk.23.attn_q.weightQ4_K[4608 4096]
-
blk.23.attn_v.weightQ6_K[4608 2048]
-
blk.24.attn_norm.weightF32[4608]
-
blk.24.ffn_down.weightQ4_K[36864 4608]
-
blk.24.ffn_gate.weightQ4_K[4608 36864]
-
blk.24.ffn_up.weightQ4_K[4608 36864]
-
blk.24.post_attention_norm.weightF32[4608]
-
blk.24.post_ffw_norm.weightF32[4608]
-
blk.24.ffn_norm.weightF32[4608]
-
blk.24.attn_k.weightQ4_K[4608 2048]
-
blk.24.attn_output.weightQ4_K[4096 4608]
-
blk.24.attn_q.weightQ4_K[4608 4096]
-
blk.24.attn_v.weightQ4_K[4608 2048]
-
blk.25.attn_norm.weightF32[4608]
-
blk.25.ffn_down.weightQ4_K[36864 4608]
-
blk.25.ffn_gate.weightQ4_K[4608 36864]
-
blk.25.ffn_up.weightQ4_K[4608 36864]
-
blk.25.post_attention_norm.weightF32[4608]
-
blk.25.post_ffw_norm.weightF32[4608]
-
blk.25.ffn_norm.weightF32[4608]
-
blk.25.attn_k.weightQ4_K[4608 2048]
-
blk.25.attn_output.weightQ4_K[4096 4608]
-
blk.25.attn_q.weightQ4_K[4608 4096]
-
blk.25.attn_v.weightQ4_K[4608 2048]
-
blk.26.attn_norm.weightF32[4608]
-
blk.26.ffn_down.weightQ6_K[36864 4608]
-
blk.26.ffn_gate.weightQ4_K[4608 36864]
-
blk.26.ffn_up.weightQ4_K[4608 36864]
-
blk.26.post_attention_norm.weightF32[4608]
-
blk.26.post_ffw_norm.weightF32[4608]
-
blk.26.ffn_norm.weightF32[4608]
-
blk.26.attn_k.weightQ4_K[4608 2048]
-
blk.26.attn_output.weightQ4_K[4096 4608]
-
blk.26.attn_q.weightQ4_K[4608 4096]
-
blk.26.attn_v.weightQ6_K[4608 2048]
-
blk.27.attn_norm.weightF32[4608]
-
blk.27.ffn_down.weightQ4_K[36864 4608]
-
blk.27.ffn_gate.weightQ4_K[4608 36864]
-
blk.27.ffn_up.weightQ4_K[4608 36864]
-
blk.27.post_attention_norm.weightF32[4608]
-
blk.27.post_ffw_norm.weightF32[4608]
-
blk.27.ffn_norm.weightF32[4608]
-
blk.27.attn_k.weightQ4_K[4608 2048]
-
blk.27.attn_output.weightQ4_K[4096 4608]
-
blk.27.attn_q.weightQ4_K[4608 4096]
-
blk.27.attn_v.weightQ4_K[4608 2048]
-
blk.28.attn_norm.weightF32[4608]
-
blk.28.ffn_down.weightQ4_K[36864 4608]
-
blk.28.ffn_gate.weightQ4_K[4608 36864]
-
blk.28.ffn_up.weightQ4_K[4608 36864]
-
blk.28.post_attention_norm.weightF32[4608]
-
blk.28.post_ffw_norm.weightF32[4608]
-
blk.28.ffn_norm.weightF32[4608]
-
blk.28.attn_k.weightQ4_K[4608 2048]
-
blk.28.attn_output.weightQ4_K[4096 4608]
-
blk.28.attn_q.weightQ4_K[4608 4096]
-
blk.28.attn_v.weightQ4_K[4608 2048]
-
blk.29.attn_norm.weightF32[4608]
-
blk.29.ffn_down.weightQ6_K[36864 4608]
-
blk.29.ffn_gate.weightQ4_K[4608 36864]
-
blk.29.ffn_up.weightQ4_K[4608 36864]
-
blk.29.post_attention_norm.weightF32[4608]
-
blk.29.post_ffw_norm.weightF32[4608]
-
blk.29.ffn_norm.weightF32[4608]
-
blk.29.attn_k.weightQ4_K[4608 2048]
-
blk.29.attn_output.weightQ4_K[4096 4608]
-
blk.29.attn_q.weightQ4_K[4608 4096]
-
blk.29.attn_v.weightQ6_K[4608 2048]
-
blk.30.attn_norm.weightF32[4608]
-
blk.30.ffn_down.weightQ4_K[36864 4608]
-
blk.30.ffn_gate.weightQ4_K[4608 36864]
-
blk.30.ffn_up.weightQ4_K[4608 36864]
-
blk.30.post_attention_norm.weightF32[4608]
-
blk.30.post_ffw_norm.weightF32[4608]
-
blk.30.ffn_norm.weightF32[4608]
-
blk.30.attn_k.weightQ4_K[4608 2048]
-
blk.30.attn_output.weightQ4_K[4096 4608]
-
blk.30.attn_q.weightQ4_K[4608 4096]
-
blk.30.attn_v.weightQ4_K[4608 2048]
-
blk.31.attn_norm.weightF32[4608]
-
blk.31.ffn_down.weightQ6_K[36864 4608]
-
blk.31.ffn_gate.weightQ4_K[4608 36864]
-
blk.31.ffn_up.weightQ4_K[4608 36864]
-
blk.31.post_attention_norm.weightF32[4608]
-
blk.31.post_ffw_norm.weightF32[4608]
-
blk.31.ffn_norm.weightF32[4608]
-
blk.31.attn_k.weightQ4_K[4608 2048]
-
blk.31.attn_output.weightQ4_K[4096 4608]
-
blk.31.attn_q.weightQ4_K[4608 4096]
-
blk.31.attn_v.weightQ6_K[4608 2048]
-
blk.32.attn_norm.weightF32[4608]
-
blk.32.ffn_down.weightQ4_K[36864 4608]
-
blk.32.ffn_gate.weightQ4_K[4608 36864]
-
blk.32.ffn_up.weightQ4_K[4608 36864]
-
blk.32.post_attention_norm.weightF32[4608]
-
blk.32.post_ffw_norm.weightF32[4608]
-
blk.32.ffn_norm.weightF32[4608]
-
blk.32.attn_k.weightQ4_K[4608 2048]
-
blk.32.attn_output.weightQ4_K[4096 4608]
-
blk.32.attn_q.weightQ4_K[4608 4096]
-
blk.32.attn_v.weightQ4_K[4608 2048]
-
blk.33.attn_norm.weightF32[4608]
-
blk.33.ffn_down.weightQ4_K[36864 4608]
-
blk.33.ffn_gate.weightQ4_K[4608 36864]
-
blk.33.ffn_up.weightQ4_K[4608 36864]
-
blk.33.post_attention_norm.weightF32[4608]
-
blk.33.post_ffw_norm.weightF32[4608]
-
blk.33.ffn_norm.weightF32[4608]
-
blk.33.attn_k.weightQ4_K[4608 2048]
-
blk.33.attn_output.weightQ4_K[4096 4608]
-
blk.33.attn_q.weightQ4_K[4608 4096]
-
blk.33.attn_v.weightQ4_K[4608 2048]
-
blk.34.attn_norm.weightF32[4608]
-
blk.34.ffn_down.weightQ6_K[36864 4608]
-
blk.34.ffn_gate.weightQ4_K[4608 36864]
-
blk.34.ffn_up.weightQ4_K[4608 36864]
-
blk.34.post_attention_norm.weightF32[4608]
-
blk.34.post_ffw_norm.weightF32[4608]
-
blk.34.ffn_norm.weightF32[4608]
-
blk.34.attn_k.weightQ4_K[4608 2048]
-
blk.34.attn_output.weightQ4_K[4096 4608]
-
blk.34.attn_q.weightQ4_K[4608 4096]
-
blk.34.attn_v.weightQ6_K[4608 2048]
-
blk.35.attn_norm.weightF32[4608]
-
blk.35.ffn_down.weightQ4_K[36864 4608]
-
blk.35.ffn_gate.weightQ4_K[4608 36864]
-
blk.35.ffn_up.weightQ4_K[4608 36864]
-
blk.35.post_attention_norm.weightF32[4608]
-
blk.35.post_ffw_norm.weightF32[4608]
-
blk.35.ffn_norm.weightF32[4608]
-
blk.35.attn_k.weightQ4_K[4608 2048]
-
blk.35.attn_output.weightQ4_K[4096 4608]
-
blk.35.attn_q.weightQ4_K[4608 4096]
-
blk.35.attn_v.weightQ4_K[4608 2048]
-
blk.36.attn_norm.weightF32[4608]
-
blk.36.ffn_down.weightQ4_K[36864 4608]
-
blk.36.ffn_gate.weightQ4_K[4608 36864]
-
blk.36.ffn_up.weightQ4_K[4608 36864]
-
blk.36.post_attention_norm.weightF32[4608]
-
blk.36.post_ffw_norm.weightF32[4608]
-
blk.36.ffn_norm.weightF32[4608]
-
blk.36.attn_k.weightQ4_K[4608 2048]
-
blk.36.attn_output.weightQ4_K[4096 4608]
-
blk.36.attn_q.weightQ4_K[4608 4096]
-
blk.36.attn_v.weightQ4_K[4608 2048]
-
blk.37.attn_norm.weightF32[4608]
-
blk.37.ffn_down.weightQ6_K[36864 4608]
-
blk.37.ffn_gate.weightQ4_K[4608 36864]
-
blk.37.ffn_up.weightQ4_K[4608 36864]
-
blk.37.post_attention_norm.weightF32[4608]
-
blk.37.post_ffw_norm.weightF32[4608]
-
blk.37.ffn_norm.weightF32[4608]
-
blk.37.attn_k.weightQ4_K[4608 2048]
-
blk.37.attn_output.weightQ4_K[4096 4608]
-
blk.37.attn_q.weightQ4_K[4608 4096]
-
blk.37.attn_v.weightQ6_K[4608 2048]
-
blk.38.attn_norm.weightF32[4608]
-
blk.38.ffn_down.weightQ4_K[36864 4608]
-
blk.38.ffn_gate.weightQ4_K[4608 36864]
-
blk.38.ffn_up.weightQ4_K[4608 36864]
-
blk.38.post_attention_norm.weightF32[4608]
-
blk.38.post_ffw_norm.weightF32[4608]
-
blk.38.ffn_norm.weightF32[4608]
-
blk.38.attn_k.weightQ4_K[4608 2048]
-
blk.38.attn_output.weightQ4_K[4096 4608]
-
blk.38.attn_q.weightQ4_K[4608 4096]
-
blk.38.attn_v.weightQ4_K[4608 2048]
-
blk.39.attn_norm.weightF32[4608]
-
blk.39.ffn_down.weightQ4_K[36864 4608]
-
blk.39.ffn_gate.weightQ4_K[4608 36864]
-
blk.39.ffn_up.weightQ4_K[4608 36864]
-
blk.39.post_attention_norm.weightF32[4608]
-
blk.39.post_ffw_norm.weightF32[4608]
-
blk.39.ffn_norm.weightF32[4608]
-
blk.39.attn_k.weightQ4_K[4608 2048]
-
blk.39.attn_output.weightQ4_K[4096 4608]
-
blk.39.attn_q.weightQ4_K[4608 4096]
-
blk.39.attn_v.weightQ4_K[4608 2048]
-
blk.40.attn_norm.weightF32[4608]
-
blk.40.ffn_down.weightQ4_K[36864 4608]
-
blk.40.ffn_gate.weightQ4_K[4608 36864]
-
blk.40.ffn_up.weightQ4_K[4608 36864]
-
blk.40.post_attention_norm.weightF32[4608]
-
blk.40.post_ffw_norm.weightF32[4608]
-
blk.40.ffn_norm.weightF32[4608]
-
blk.40.attn_k.weightQ4_K[4608 2048]
-
blk.40.attn_output.weightQ4_K[4096 4608]
-
blk.40.attn_q.weightQ4_K[4608 4096]
-
blk.40.attn_v.weightQ4_K[4608 2048]
-
blk.41.attn_norm.weightF32[4608]
-
blk.41.ffn_down.weightQ4_K[36864 4608]
-
blk.41.ffn_gate.weightQ4_K[4608 36864]
-
blk.41.ffn_up.weightQ4_K[4608 36864]
-
blk.41.post_attention_norm.weightF32[4608]
-
blk.41.post_ffw_norm.weightF32[4608]
-
blk.41.ffn_norm.weightF32[4608]
-
blk.41.attn_k.weightQ4_K[4608 2048]
-
blk.41.attn_output.weightQ4_K[4096 4608]
-
blk.41.attn_q.weightQ4_K[4608 4096]
-
blk.41.attn_v.weightQ4_K[4608 2048]
-
blk.42.attn_norm.weightF32[4608]
-
blk.42.ffn_down.weightQ6_K[36864 4608]
-
blk.42.ffn_gate.weightQ4_K[4608 36864]
-
blk.42.ffn_up.weightQ4_K[4608 36864]
-
blk.42.post_attention_norm.weightF32[4608]
-
blk.42.post_ffw_norm.weightF32[4608]
-
blk.42.ffn_norm.weightF32[4608]
-
blk.42.attn_k.weightQ4_K[4608 2048]
-
blk.42.attn_output.weightQ4_K[4096 4608]
-
blk.42.attn_q.weightQ4_K[4608 4096]
-
blk.42.attn_v.weightQ6_K[4608 2048]
-
blk.43.attn_norm.weightF32[4608]
-
blk.43.ffn_down.weightQ4_K[36864 4608]
-
blk.43.ffn_gate.weightQ4_K[4608 36864]
-
blk.43.ffn_up.weightQ4_K[4608 36864]
-
blk.43.post_attention_norm.weightF32[4608]
-
blk.43.post_ffw_norm.weightF32[4608]
-
blk.43.ffn_norm.weightF32[4608]
-
blk.43.attn_k.weightQ4_K[4608 2048]
-
blk.43.attn_output.weightQ4_K[4096 4608]
-
blk.43.attn_q.weightQ4_K[4608 4096]
-
blk.43.attn_v.weightQ4_K[4608 2048]
-
blk.44.attn_norm.weightF32[4608]
-
blk.44.ffn_down.weightQ4_K[36864 4608]
-
blk.44.ffn_gate.weightQ4_K[4608 36864]
-
blk.44.ffn_up.weightQ4_K[4608 36864]
-
blk.44.post_attention_norm.weightF32[4608]
-
blk.44.post_ffw_norm.weightF32[4608]
-
blk.44.ffn_norm.weightF32[4608]
-
blk.44.attn_k.weightQ4_K[4608 2048]
-
blk.44.attn_output.weightQ4_K[4096 4608]
-
blk.44.attn_q.weightQ4_K[4608 4096]
-
blk.44.attn_v.weightQ4_K[4608 2048]
-
blk.45.attn_norm.weightF32[4608]
-
blk.45.ffn_down.weightQ6_K[36864 4608]
-
blk.45.ffn_gate.weightQ4_K[4608 36864]
-
blk.45.ffn_up.weightQ4_K[4608 36864]
-
blk.45.post_attention_norm.weightF32[4608]
-
blk.45.post_ffw_norm.weightF32[4608]
-
blk.45.ffn_norm.weightF32[4608]
-
blk.45.attn_k.weightQ4_K[4608 2048]
-
blk.45.attn_output.weightQ4_K[4096 4608]
-
blk.45.attn_q.weightQ4_K[4608 4096]
-
blk.45.attn_v.weightQ6_K[4608 2048]
-
output_norm.weightF32[4608]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45