InternLM 2.5 20b and 7b from Q4 to Q8
7B
87 Pulls Updated 6 weeks ago
e158fd5243fe · 12GB
-
general.architectureinternlm2
-
general.file_typeQ4_K_M
-
internlm2.attention.head_count48
-
internlm2.attention.head_count_kv8
-
internlm2.attention.layer_norm_rms_epsilon1e-05
-
internlm2.block_count48
-
internlm2.context_length32768
-
internlm2.embedding_length6144
-
internlm2.feed_forward_length16384
-
internlm2.rope.freq_base5e+07
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id92542
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[6144 92544]
-
blk.0.attn_output.weightQ4_K[6144 6144]
-
blk.0.attn_q.weightQ4_K[6144 6144]
-
blk.0.attn_k.weightQ4_K[6144 1024]
-
blk.0.attn_v.weightQ6_K[6144 1024]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_gate.weightQ4_K[6144 16384]
-
blk.0.ffn_down.weightQ6_K[16384 6144]
-
blk.0.ffn_up.weightQ4_K[6144 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.1.attn_output.weightQ4_K[6144 6144]
-
blk.1.attn_q.weightQ4_K[6144 6144]
-
blk.1.attn_k.weightQ4_K[6144 1024]
-
blk.1.attn_v.weightQ6_K[6144 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_gate.weightQ4_K[6144 16384]
-
blk.1.ffn_down.weightQ6_K[16384 6144]
-
blk.1.ffn_up.weightQ4_K[6144 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.2.attn_output.weightQ4_K[6144 6144]
-
blk.2.attn_q.weightQ4_K[6144 6144]
-
blk.2.attn_k.weightQ4_K[6144 1024]
-
blk.2.attn_v.weightQ6_K[6144 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_gate.weightQ4_K[6144 16384]
-
blk.2.ffn_down.weightQ6_K[16384 6144]
-
blk.2.ffn_up.weightQ4_K[6144 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.3.attn_output.weightQ4_K[6144 6144]
-
blk.3.attn_q.weightQ4_K[6144 6144]
-
blk.3.attn_k.weightQ4_K[6144 1024]
-
blk.3.attn_v.weightQ6_K[6144 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_gate.weightQ4_K[6144 16384]
-
blk.3.ffn_down.weightQ6_K[16384 6144]
-
blk.3.ffn_up.weightQ4_K[6144 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.4.attn_output.weightQ4_K[6144 6144]
-
blk.4.attn_q.weightQ4_K[6144 6144]
-
blk.4.attn_k.weightQ4_K[6144 1024]
-
blk.4.attn_v.weightQ4_K[6144 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_gate.weightQ4_K[6144 16384]
-
blk.4.ffn_down.weightQ6_K[16384 6144]
-
blk.4.ffn_up.weightQ4_K[6144 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.5.attn_output.weightQ4_K[6144 6144]
-
blk.5.attn_q.weightQ4_K[6144 6144]
-
blk.5.attn_k.weightQ4_K[6144 1024]
-
blk.5.attn_v.weightQ4_K[6144 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_gate.weightQ4_K[6144 16384]
-
blk.5.ffn_down.weightQ4_K[16384 6144]
-
blk.5.ffn_up.weightQ4_K[6144 16384]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.6.attn_output.weightQ4_K[6144 6144]
-
blk.6.attn_q.weightQ4_K[6144 6144]
-
blk.6.attn_k.weightQ4_K[6144 1024]
-
blk.6.attn_v.weightQ6_K[6144 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_gate.weightQ4_K[6144 16384]
-
blk.6.ffn_down.weightQ4_K[16384 6144]
-
blk.6.ffn_up.weightQ4_K[6144 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.7.attn_output.weightQ4_K[6144 6144]
-
blk.7.attn_q.weightQ4_K[6144 6144]
-
blk.7.attn_k.weightQ4_K[6144 1024]
-
blk.7.attn_v.weightQ4_K[6144 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_gate.weightQ4_K[6144 16384]
-
blk.7.ffn_down.weightQ6_K[16384 6144]
-
blk.7.ffn_up.weightQ4_K[6144 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.8.attn_output.weightQ4_K[6144 6144]
-
blk.8.attn_q.weightQ4_K[6144 6144]
-
blk.8.attn_k.weightQ4_K[6144 1024]
-
blk.8.attn_v.weightQ4_K[6144 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_gate.weightQ4_K[6144 16384]
-
blk.8.ffn_down.weightQ4_K[16384 6144]
-
blk.8.ffn_up.weightQ4_K[6144 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.9.attn_output.weightQ4_K[6144 6144]
-
blk.9.attn_q.weightQ4_K[6144 6144]
-
blk.9.attn_k.weightQ4_K[6144 1024]
-
blk.9.attn_v.weightQ6_K[6144 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_gate.weightQ4_K[6144 16384]
-
blk.9.ffn_down.weightQ4_K[16384 6144]
-
blk.9.ffn_up.weightQ4_K[6144 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.10.attn_output.weightQ4_K[6144 6144]
-
blk.10.attn_q.weightQ4_K[6144 6144]
-
blk.10.attn_k.weightQ4_K[6144 1024]
-
blk.10.attn_v.weightQ6_K[6144 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_gate.weightQ4_K[6144 16384]
-
blk.10.ffn_down.weightQ6_K[16384 6144]
-
blk.10.ffn_up.weightQ4_K[6144 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.11.attn_output.weightQ4_K[6144 6144]
-
blk.11.attn_q.weightQ4_K[6144 6144]
-
blk.11.attn_k.weightQ4_K[6144 1024]
-
blk.11.attn_v.weightQ6_K[6144 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_gate.weightQ4_K[6144 16384]
-
blk.11.ffn_down.weightQ6_K[16384 6144]
-
blk.11.ffn_up.weightQ4_K[6144 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.12.attn_output.weightQ4_K[6144 6144]
-
blk.12.attn_q.weightQ4_K[6144 6144]
-
blk.12.attn_k.weightQ4_K[6144 1024]
-
blk.12.attn_v.weightQ4_K[6144 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_gate.weightQ4_K[6144 16384]
-
blk.12.ffn_down.weightQ4_K[16384 6144]
-
blk.12.ffn_up.weightQ4_K[6144 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.13.attn_output.weightQ4_K[6144 6144]
-
blk.13.attn_q.weightQ4_K[6144 6144]
-
blk.13.attn_k.weightQ4_K[6144 1024]
-
blk.13.attn_v.weightQ4_K[6144 1024]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_gate.weightQ4_K[6144 16384]
-
blk.13.ffn_down.weightQ4_K[16384 6144]
-
blk.13.ffn_up.weightQ4_K[6144 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.14.attn_output.weightQ4_K[6144 6144]
-
blk.14.attn_q.weightQ4_K[6144 6144]
-
blk.14.attn_k.weightQ4_K[6144 1024]
-
blk.14.attn_v.weightQ6_K[6144 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_gate.weightQ4_K[6144 16384]
-
blk.14.ffn_down.weightQ6_K[16384 6144]
-
blk.14.ffn_up.weightQ4_K[6144 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.15.attn_output.weightQ4_K[6144 6144]
-
blk.15.attn_q.weightQ4_K[6144 6144]
-
blk.15.attn_k.weightQ4_K[6144 1024]
-
blk.15.attn_v.weightQ4_K[6144 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_gate.weightQ4_K[6144 16384]
-
blk.15.ffn_down.weightQ4_K[16384 6144]
-
blk.15.ffn_up.weightQ4_K[6144 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.16.attn_output.weightQ4_K[6144 6144]
-
blk.16.attn_q.weightQ4_K[6144 6144]
-
blk.16.attn_k.weightQ4_K[6144 1024]
-
blk.16.attn_v.weightQ4_K[6144 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_gate.weightQ4_K[6144 16384]
-
blk.16.ffn_down.weightQ4_K[16384 6144]
-
blk.16.ffn_up.weightQ4_K[6144 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.17.attn_output.weightQ4_K[6144 6144]
-
blk.17.attn_q.weightQ4_K[6144 6144]
-
blk.17.attn_k.weightQ4_K[6144 1024]
-
blk.17.attn_v.weightQ6_K[6144 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_gate.weightQ4_K[6144 16384]
-
blk.17.ffn_down.weightQ6_K[16384 6144]
-
blk.17.ffn_up.weightQ4_K[6144 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.18.attn_output.weightQ4_K[6144 6144]
-
blk.18.attn_q.weightQ4_K[6144 6144]
-
blk.18.attn_k.weightQ4_K[6144 1024]
-
blk.18.attn_v.weightQ4_K[6144 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_gate.weightQ4_K[6144 16384]
-
blk.18.ffn_down.weightQ4_K[16384 6144]
-
blk.18.ffn_up.weightQ4_K[6144 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.19.attn_output.weightQ4_K[6144 6144]
-
blk.19.attn_q.weightQ4_K[6144 6144]
-
blk.19.attn_k.weightQ4_K[6144 1024]
-
blk.19.attn_v.weightQ4_K[6144 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_gate.weightQ4_K[6144 16384]
-
blk.19.ffn_down.weightQ4_K[16384 6144]
-
blk.19.ffn_up.weightQ4_K[6144 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.20.attn_output.weightQ4_K[6144 6144]
-
blk.20.attn_q.weightQ4_K[6144 6144]
-
blk.20.attn_k.weightQ4_K[6144 1024]
-
blk.20.attn_v.weightQ6_K[6144 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_gate.weightQ4_K[6144 16384]
-
blk.20.ffn_down.weightQ6_K[16384 6144]
-
blk.20.ffn_up.weightQ4_K[6144 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.21.attn_output.weightQ4_K[6144 6144]
-
blk.21.attn_q.weightQ4_K[6144 6144]
-
blk.21.attn_k.weightQ4_K[6144 1024]
-
blk.21.attn_v.weightQ4_K[6144 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_gate.weightQ4_K[6144 16384]
-
blk.21.ffn_down.weightQ4_K[16384 6144]
-
blk.21.ffn_up.weightQ4_K[6144 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.22.attn_output.weightQ4_K[6144 6144]
-
blk.22.attn_q.weightQ4_K[6144 6144]
-
blk.22.attn_k.weightQ4_K[6144 1024]
-
blk.22.attn_v.weightQ4_K[6144 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_gate.weightQ4_K[6144 16384]
-
blk.22.ffn_down.weightQ4_K[16384 6144]
-
blk.22.ffn_up.weightQ4_K[6144 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.23.attn_output.weightQ4_K[6144 6144]
-
blk.23.attn_q.weightQ4_K[6144 6144]
-
blk.23.attn_k.weightQ4_K[6144 1024]
-
blk.23.attn_v.weightQ6_K[6144 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_gate.weightQ4_K[6144 16384]
-
blk.23.ffn_down.weightQ6_K[16384 6144]
-
blk.23.ffn_up.weightQ4_K[6144 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.24.attn_output.weightQ4_K[6144 6144]
-
blk.24.attn_q.weightQ4_K[6144 6144]
-
blk.24.attn_k.weightQ4_K[6144 1024]
-
blk.24.attn_v.weightQ4_K[6144 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_gate.weightQ4_K[6144 16384]
-
blk.24.ffn_down.weightQ4_K[16384 6144]
-
blk.24.ffn_up.weightQ4_K[6144 16384]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.25.attn_output.weightQ4_K[6144 6144]
-
blk.25.attn_q.weightQ4_K[6144 6144]
-
blk.25.attn_k.weightQ4_K[6144 1024]
-
blk.25.attn_v.weightQ4_K[6144 1024]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_gate.weightQ4_K[6144 16384]
-
blk.25.ffn_down.weightQ4_K[16384 6144]
-
blk.25.ffn_up.weightQ4_K[6144 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.26.attn_output.weightQ4_K[6144 6144]
-
blk.26.attn_q.weightQ4_K[6144 6144]
-
blk.26.attn_k.weightQ4_K[6144 1024]
-
blk.26.attn_v.weightQ6_K[6144 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_gate.weightQ4_K[6144 16384]
-
blk.26.ffn_down.weightQ6_K[16384 6144]
-
blk.26.ffn_up.weightQ4_K[6144 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.27.attn_output.weightQ4_K[6144 6144]
-
blk.27.attn_q.weightQ4_K[6144 6144]
-
blk.27.attn_k.weightQ4_K[6144 1024]
-
blk.27.attn_v.weightQ4_K[6144 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_gate.weightQ4_K[6144 16384]
-
blk.27.ffn_down.weightQ4_K[16384 6144]
-
blk.27.ffn_up.weightQ4_K[6144 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.28.attn_output.weightQ4_K[6144 6144]
-
blk.28.attn_q.weightQ4_K[6144 6144]
-
blk.28.attn_k.weightQ4_K[6144 1024]
-
blk.28.attn_v.weightQ4_K[6144 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_gate.weightQ4_K[6144 16384]
-
blk.28.ffn_down.weightQ4_K[16384 6144]
-
blk.28.ffn_up.weightQ4_K[6144 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.29.attn_output.weightQ4_K[6144 6144]
-
blk.29.attn_q.weightQ4_K[6144 6144]
-
blk.29.attn_k.weightQ4_K[6144 1024]
-
blk.29.attn_v.weightQ6_K[6144 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_gate.weightQ4_K[6144 16384]
-
blk.29.ffn_down.weightQ6_K[16384 6144]
-
blk.29.ffn_up.weightQ4_K[6144 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.30.attn_output.weightQ4_K[6144 6144]
-
blk.30.attn_q.weightQ4_K[6144 6144]
-
blk.30.attn_k.weightQ4_K[6144 1024]
-
blk.30.attn_v.weightQ4_K[6144 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_gate.weightQ4_K[6144 16384]
-
blk.30.ffn_down.weightQ4_K[16384 6144]
-
blk.30.ffn_up.weightQ4_K[6144 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.31.attn_output.weightQ4_K[6144 6144]
-
blk.31.attn_q.weightQ4_K[6144 6144]
-
blk.31.attn_k.weightQ4_K[6144 1024]
-
blk.31.attn_v.weightQ4_K[6144 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_gate.weightQ4_K[6144 16384]
-
blk.31.ffn_down.weightQ4_K[16384 6144]
-
blk.31.ffn_up.weightQ4_K[6144 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.32.attn_output.weightQ4_K[6144 6144]
-
blk.32.attn_q.weightQ4_K[6144 6144]
-
blk.32.attn_k.weightQ4_K[6144 1024]
-
blk.32.attn_v.weightQ6_K[6144 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_gate.weightQ4_K[6144 16384]
-
blk.32.ffn_down.weightQ6_K[16384 6144]
-
blk.32.ffn_up.weightQ4_K[6144 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.33.attn_output.weightQ4_K[6144 6144]
-
blk.33.attn_q.weightQ4_K[6144 6144]
-
blk.33.attn_k.weightQ4_K[6144 1024]
-
blk.33.attn_v.weightQ4_K[6144 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_gate.weightQ4_K[6144 16384]
-
blk.33.ffn_down.weightQ4_K[16384 6144]
-
blk.33.ffn_up.weightQ4_K[6144 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.34.attn_output.weightQ4_K[6144 6144]
-
blk.34.attn_q.weightQ4_K[6144 6144]
-
blk.34.attn_k.weightQ4_K[6144 1024]
-
blk.34.attn_v.weightQ4_K[6144 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_gate.weightQ4_K[6144 16384]
-
blk.34.ffn_down.weightQ4_K[16384 6144]
-
blk.34.ffn_up.weightQ4_K[6144 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.35.attn_output.weightQ4_K[6144 6144]
-
blk.35.attn_q.weightQ4_K[6144 6144]
-
blk.35.attn_k.weightQ4_K[6144 1024]
-
blk.35.attn_v.weightQ6_K[6144 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_gate.weightQ4_K[6144 16384]
-
blk.35.ffn_down.weightQ6_K[16384 6144]
-
blk.35.ffn_up.weightQ4_K[6144 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.36.attn_output.weightQ4_K[6144 6144]
-
blk.36.attn_q.weightQ4_K[6144 6144]
-
blk.36.attn_k.weightQ4_K[6144 1024]
-
blk.36.attn_v.weightQ4_K[6144 1024]
-
blk.36.ffn_gate.weightQ4_K[6144 16384]
-
blk.36.ffn_up.weightQ4_K[6144 16384]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_down.weightQ4_K[16384 6144]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.37.attn_output.weightQ4_K[6144 6144]
-
blk.37.attn_q.weightQ4_K[6144 6144]
-
blk.37.attn_k.weightQ4_K[6144 1024]
-
blk.37.attn_v.weightQ4_K[6144 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_gate.weightQ4_K[6144 16384]
-
blk.37.ffn_down.weightQ4_K[16384 6144]
-
blk.37.ffn_up.weightQ4_K[6144 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.38.attn_output.weightQ4_K[6144 6144]
-
blk.38.attn_q.weightQ4_K[6144 6144]
-
blk.38.attn_k.weightQ4_K[6144 1024]
-
blk.38.attn_v.weightQ6_K[6144 1024]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_gate.weightQ4_K[6144 16384]
-
blk.38.ffn_down.weightQ6_K[16384 6144]
-
blk.38.ffn_up.weightQ4_K[6144 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.39.attn_output.weightQ4_K[6144 6144]
-
blk.39.attn_q.weightQ4_K[6144 6144]
-
blk.39.attn_k.weightQ4_K[6144 1024]
-
blk.39.attn_v.weightQ4_K[6144 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_gate.weightQ4_K[6144 16384]
-
blk.39.ffn_down.weightQ4_K[16384 6144]
-
blk.39.ffn_up.weightQ4_K[6144 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.40.attn_output.weightQ4_K[6144 6144]
-
blk.40.attn_q.weightQ4_K[6144 6144]
-
blk.40.attn_k.weightQ4_K[6144 1024]
-
blk.40.attn_v.weightQ4_K[6144 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_gate.weightQ4_K[6144 16384]
-
blk.40.ffn_down.weightQ4_K[16384 6144]
-
blk.40.ffn_up.weightQ4_K[6144 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.41.attn_output.weightQ4_K[6144 6144]
-
blk.41.attn_q.weightQ4_K[6144 6144]
-
blk.41.attn_k.weightQ4_K[6144 1024]
-
blk.41.attn_v.weightQ6_K[6144 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_gate.weightQ4_K[6144 16384]
-
blk.41.ffn_down.weightQ6_K[16384 6144]
-
blk.41.ffn_up.weightQ4_K[6144 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.42.attn_output.weightQ4_K[6144 6144]
-
blk.42.attn_q.weightQ4_K[6144 6144]
-
blk.42.attn_k.weightQ4_K[6144 1024]
-
blk.42.attn_v.weightQ6_K[6144 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_gate.weightQ4_K[6144 16384]
-
blk.42.ffn_down.weightQ6_K[16384 6144]
-
blk.42.ffn_up.weightQ4_K[6144 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.43.attn_output.weightQ4_K[6144 6144]
-
blk.43.attn_q.weightQ4_K[6144 6144]
-
blk.43.attn_k.weightQ4_K[6144 1024]
-
blk.43.attn_v.weightQ6_K[6144 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_gate.weightQ4_K[6144 16384]
-
blk.43.ffn_down.weightQ6_K[16384 6144]
-
blk.43.ffn_up.weightQ4_K[6144 16384]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.44.attn_output.weightQ4_K[6144 6144]
-
blk.44.attn_q.weightQ4_K[6144 6144]
-
blk.44.attn_k.weightQ4_K[6144 1024]
-
blk.44.attn_v.weightQ6_K[6144 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_gate.weightQ4_K[6144 16384]
-
blk.44.ffn_down.weightQ6_K[16384 6144]
-
blk.44.ffn_up.weightQ4_K[6144 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.45.attn_output.weightQ4_K[6144 6144]
-
blk.45.attn_q.weightQ4_K[6144 6144]
-
blk.45.attn_k.weightQ4_K[6144 1024]
-
blk.45.attn_v.weightQ6_K[6144 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_gate.weightQ4_K[6144 16384]
-
blk.45.ffn_down.weightQ6_K[16384 6144]
-
blk.45.ffn_up.weightQ4_K[6144 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.46.attn_output.weightQ4_K[6144 6144]
-
blk.46.attn_q.weightQ4_K[6144 6144]
-
blk.46.attn_k.weightQ4_K[6144 1024]
-
blk.46.attn_v.weightQ6_K[6144 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_gate.weightQ4_K[6144 16384]
-
blk.46.ffn_down.weightQ6_K[16384 6144]
-
blk.46.ffn_up.weightQ4_K[6144 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.47.attn_output.weightQ4_K[6144 6144]
-
blk.47.attn_q.weightQ4_K[6144 6144]
-
blk.47.attn_k.weightQ4_K[6144 1024]
-
blk.47.attn_v.weightQ6_K[6144 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_gate.weightQ4_K[6144 16384]
-
blk.47.ffn_down.weightQ6_K[16384 6144]
-
blk.47.ffn_up.weightQ4_K[6144 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
output_norm.weightF32[6144]
-
output.weightQ6_K[6144 92544]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47