latest
11GB
15 Pulls Updated 4 months ago
7dea45d84113 · 11GB
-
general.architectureinternlm2
-
general.file_typeQ4_0
-
internlm2.attention.head_count48
-
internlm2.attention.head_count_kv8
-
internlm2.attention.layer_norm_rms_epsilon1e-05
-
internlm2.block_count48
-
internlm2.context_length32768
-
internlm2.embedding_length6144
-
internlm2.feed_forward_length16384
-
internlm2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id92542
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
NameTypeShape
-
token_embd.weightQ4_0[6144 92544]
-
blk.0.attn_output.weightQ4_0[6144 6144]
-
blk.0.attn_q.weightQ4_0[6144 6144]
-
blk.0.attn_k.weightQ4_0[6144 1024]
-
blk.0.attn_v.weightQ4_0[6144 1024]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_gate.weightQ4_0[6144 16384]
-
blk.0.ffn_down.weightQ4_0[16384 6144]
-
blk.0.ffn_up.weightQ4_0[6144 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.1.attn_output.weightQ4_0[6144 6144]
-
blk.1.attn_q.weightQ4_0[6144 6144]
-
blk.1.attn_k.weightQ4_0[6144 1024]
-
blk.1.attn_v.weightQ4_0[6144 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_gate.weightQ4_0[6144 16384]
-
blk.1.ffn_down.weightQ4_0[16384 6144]
-
blk.1.ffn_up.weightQ4_0[6144 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.2.attn_output.weightQ4_0[6144 6144]
-
blk.2.attn_q.weightQ4_0[6144 6144]
-
blk.2.attn_k.weightQ4_0[6144 1024]
-
blk.2.attn_v.weightQ4_0[6144 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_gate.weightQ4_0[6144 16384]
-
blk.2.ffn_down.weightQ4_0[16384 6144]
-
blk.2.ffn_up.weightQ4_0[6144 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.3.attn_output.weightQ4_0[6144 6144]
-
blk.3.attn_q.weightQ4_0[6144 6144]
-
blk.3.attn_k.weightQ4_0[6144 1024]
-
blk.3.attn_v.weightQ4_0[6144 1024]
-
blk.3.ffn_gate.weightQ4_0[6144 16384]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_down.weightQ4_0[16384 6144]
-
blk.3.ffn_up.weightQ4_0[6144 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.4.attn_output.weightQ4_0[6144 6144]
-
blk.4.attn_q.weightQ4_0[6144 6144]
-
blk.4.attn_k.weightQ4_0[6144 1024]
-
blk.4.attn_v.weightQ4_0[6144 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_gate.weightQ4_0[6144 16384]
-
blk.4.ffn_down.weightQ4_0[16384 6144]
-
blk.4.ffn_up.weightQ4_0[6144 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.5.attn_output.weightQ4_0[6144 6144]
-
blk.5.attn_q.weightQ4_0[6144 6144]
-
blk.5.attn_k.weightQ4_0[6144 1024]
-
blk.5.attn_v.weightQ4_0[6144 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_gate.weightQ4_0[6144 16384]
-
blk.5.ffn_down.weightQ4_0[16384 6144]
-
blk.5.ffn_up.weightQ4_0[6144 16384]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.6.attn_output.weightQ4_0[6144 6144]
-
blk.6.attn_q.weightQ4_0[6144 6144]
-
blk.6.attn_k.weightQ4_0[6144 1024]
-
blk.6.attn_v.weightQ4_0[6144 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_gate.weightQ4_0[6144 16384]
-
blk.6.ffn_down.weightQ4_0[16384 6144]
-
blk.6.ffn_up.weightQ4_0[6144 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.7.attn_output.weightQ4_0[6144 6144]
-
blk.7.attn_q.weightQ4_0[6144 6144]
-
blk.7.attn_k.weightQ4_0[6144 1024]
-
blk.7.attn_v.weightQ4_0[6144 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_gate.weightQ4_0[6144 16384]
-
blk.7.ffn_down.weightQ4_0[16384 6144]
-
blk.7.ffn_up.weightQ4_0[6144 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.8.attn_output.weightQ4_0[6144 6144]
-
blk.8.attn_q.weightQ4_0[6144 6144]
-
blk.8.attn_k.weightQ4_0[6144 1024]
-
blk.8.attn_v.weightQ4_0[6144 1024]
-
blk.8.ffn_gate.weightQ4_0[6144 16384]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_down.weightQ4_0[16384 6144]
-
blk.8.ffn_up.weightQ4_0[6144 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.9.attn_output.weightQ4_0[6144 6144]
-
blk.9.attn_q.weightQ4_0[6144 6144]
-
blk.9.attn_k.weightQ4_0[6144 1024]
-
blk.9.attn_v.weightQ4_0[6144 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_gate.weightQ4_0[6144 16384]
-
blk.9.ffn_down.weightQ4_0[16384 6144]
-
blk.9.ffn_up.weightQ4_0[6144 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.10.attn_output.weightQ4_0[6144 6144]
-
blk.10.attn_q.weightQ4_0[6144 6144]
-
blk.10.attn_k.weightQ4_0[6144 1024]
-
blk.10.attn_v.weightQ4_0[6144 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_gate.weightQ4_0[6144 16384]
-
blk.10.ffn_down.weightQ4_0[16384 6144]
-
blk.10.ffn_up.weightQ4_0[6144 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.11.attn_output.weightQ4_0[6144 6144]
-
blk.11.attn_q.weightQ4_0[6144 6144]
-
blk.11.attn_k.weightQ4_0[6144 1024]
-
blk.11.attn_v.weightQ4_0[6144 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_gate.weightQ4_0[6144 16384]
-
blk.11.ffn_down.weightQ4_0[16384 6144]
-
blk.11.ffn_up.weightQ4_0[6144 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.12.attn_output.weightQ4_0[6144 6144]
-
blk.12.attn_q.weightQ4_0[6144 6144]
-
blk.12.attn_k.weightQ4_0[6144 1024]
-
blk.12.attn_v.weightQ4_0[6144 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_gate.weightQ4_0[6144 16384]
-
blk.12.ffn_down.weightQ4_0[16384 6144]
-
blk.12.ffn_up.weightQ4_0[6144 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.13.attn_output.weightQ4_0[6144 6144]
-
blk.13.attn_q.weightQ4_0[6144 6144]
-
blk.13.attn_k.weightQ4_0[6144 1024]
-
blk.13.attn_v.weightQ4_0[6144 1024]
-
blk.13.ffn_gate.weightQ4_0[6144 16384]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_down.weightQ4_0[16384 6144]
-
blk.13.ffn_up.weightQ4_0[6144 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.14.attn_output.weightQ4_0[6144 6144]
-
blk.14.attn_q.weightQ4_0[6144 6144]
-
blk.14.attn_k.weightQ4_0[6144 1024]
-
blk.14.attn_v.weightQ4_0[6144 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_gate.weightQ4_0[6144 16384]
-
blk.14.ffn_down.weightQ4_0[16384 6144]
-
blk.14.ffn_up.weightQ4_0[6144 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.15.attn_output.weightQ4_0[6144 6144]
-
blk.15.attn_q.weightQ4_0[6144 6144]
-
blk.15.attn_k.weightQ4_0[6144 1024]
-
blk.15.attn_v.weightQ4_0[6144 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_gate.weightQ4_0[6144 16384]
-
blk.15.ffn_down.weightQ4_0[16384 6144]
-
blk.15.ffn_up.weightQ4_0[6144 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.16.attn_output.weightQ4_0[6144 6144]
-
blk.16.attn_q.weightQ4_0[6144 6144]
-
blk.16.attn_k.weightQ4_0[6144 1024]
-
blk.16.attn_v.weightQ4_0[6144 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_gate.weightQ4_0[6144 16384]
-
blk.16.ffn_down.weightQ4_0[16384 6144]
-
blk.16.ffn_up.weightQ4_0[6144 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.17.attn_output.weightQ4_0[6144 6144]
-
blk.17.attn_q.weightQ4_0[6144 6144]
-
blk.17.attn_k.weightQ4_0[6144 1024]
-
blk.17.attn_v.weightQ4_0[6144 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_gate.weightQ4_0[6144 16384]
-
blk.17.ffn_down.weightQ4_0[16384 6144]
-
blk.17.ffn_up.weightQ4_0[6144 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.18.attn_output.weightQ4_0[6144 6144]
-
blk.18.attn_q.weightQ4_0[6144 6144]
-
blk.18.attn_k.weightQ4_0[6144 1024]
-
blk.18.attn_v.weightQ4_0[6144 1024]
-
blk.18.ffn_gate.weightQ4_0[6144 16384]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_down.weightQ4_0[16384 6144]
-
blk.18.ffn_up.weightQ4_0[6144 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.19.attn_output.weightQ4_0[6144 6144]
-
blk.19.attn_q.weightQ4_0[6144 6144]
-
blk.19.attn_k.weightQ4_0[6144 1024]
-
blk.19.attn_v.weightQ4_0[6144 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_gate.weightQ4_0[6144 16384]
-
blk.19.ffn_down.weightQ4_0[16384 6144]
-
blk.19.ffn_up.weightQ4_0[6144 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.20.attn_output.weightQ4_0[6144 6144]
-
blk.20.attn_q.weightQ4_0[6144 6144]
-
blk.20.attn_k.weightQ4_0[6144 1024]
-
blk.20.attn_v.weightQ4_0[6144 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_gate.weightQ4_0[6144 16384]
-
blk.20.ffn_down.weightQ4_0[16384 6144]
-
blk.20.ffn_up.weightQ4_0[6144 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.21.attn_output.weightQ4_0[6144 6144]
-
blk.21.attn_q.weightQ4_0[6144 6144]
-
blk.21.attn_k.weightQ4_0[6144 1024]
-
blk.21.attn_v.weightQ4_0[6144 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_gate.weightQ4_0[6144 16384]
-
blk.21.ffn_down.weightQ4_0[16384 6144]
-
blk.21.ffn_up.weightQ4_0[6144 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.22.attn_output.weightQ4_0[6144 6144]
-
blk.22.attn_q.weightQ4_0[6144 6144]
-
blk.22.attn_k.weightQ4_0[6144 1024]
-
blk.22.attn_v.weightQ4_0[6144 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_gate.weightQ4_0[6144 16384]
-
blk.22.ffn_down.weightQ4_0[16384 6144]
-
blk.22.ffn_up.weightQ4_0[6144 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.23.attn_output.weightQ4_0[6144 6144]
-
blk.23.attn_q.weightQ4_0[6144 6144]
-
blk.23.attn_k.weightQ4_0[6144 1024]
-
blk.23.attn_v.weightQ4_0[6144 1024]
-
blk.23.ffn_gate.weightQ4_0[6144 16384]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_down.weightQ4_0[16384 6144]
-
blk.23.ffn_up.weightQ4_0[6144 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.24.attn_output.weightQ4_0[6144 6144]
-
blk.24.attn_q.weightQ4_0[6144 6144]
-
blk.24.attn_k.weightQ4_0[6144 1024]
-
blk.24.attn_v.weightQ4_0[6144 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_gate.weightQ4_0[6144 16384]
-
blk.24.ffn_down.weightQ4_0[16384 6144]
-
blk.24.ffn_up.weightQ4_0[6144 16384]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.25.attn_output.weightQ4_0[6144 6144]
-
blk.25.attn_q.weightQ4_0[6144 6144]
-
blk.25.attn_k.weightQ4_0[6144 1024]
-
blk.25.attn_v.weightQ4_0[6144 1024]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_gate.weightQ4_0[6144 16384]
-
blk.25.ffn_down.weightQ4_0[16384 6144]
-
blk.25.ffn_up.weightQ4_0[6144 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.26.attn_output.weightQ4_0[6144 6144]
-
blk.26.attn_q.weightQ4_0[6144 6144]
-
blk.26.attn_k.weightQ4_0[6144 1024]
-
blk.26.attn_v.weightQ4_0[6144 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_gate.weightQ4_0[6144 16384]
-
blk.26.ffn_down.weightQ4_0[16384 6144]
-
blk.26.ffn_up.weightQ4_0[6144 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.27.attn_output.weightQ4_0[6144 6144]
-
blk.27.attn_q.weightQ4_0[6144 6144]
-
blk.27.attn_k.weightQ4_0[6144 1024]
-
blk.27.attn_v.weightQ4_0[6144 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_gate.weightQ4_0[6144 16384]
-
blk.27.ffn_down.weightQ4_0[16384 6144]
-
blk.27.ffn_up.weightQ4_0[6144 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.28.attn_output.weightQ4_0[6144 6144]
-
blk.28.attn_q.weightQ4_0[6144 6144]
-
blk.28.attn_k.weightQ4_0[6144 1024]
-
blk.28.attn_v.weightQ4_0[6144 1024]
-
blk.28.ffn_gate.weightQ4_0[6144 16384]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_down.weightQ4_0[16384 6144]
-
blk.28.ffn_up.weightQ4_0[6144 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.29.attn_output.weightQ4_0[6144 6144]
-
blk.29.attn_q.weightQ4_0[6144 6144]
-
blk.29.attn_k.weightQ4_0[6144 1024]
-
blk.29.attn_v.weightQ4_0[6144 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_gate.weightQ4_0[6144 16384]
-
blk.29.ffn_down.weightQ4_0[16384 6144]
-
blk.29.ffn_up.weightQ4_0[6144 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.30.attn_output.weightQ4_0[6144 6144]
-
blk.30.attn_q.weightQ4_0[6144 6144]
-
blk.30.attn_k.weightQ4_0[6144 1024]
-
blk.30.attn_v.weightQ4_0[6144 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_gate.weightQ4_0[6144 16384]
-
blk.30.ffn_down.weightQ4_0[16384 6144]
-
blk.30.ffn_up.weightQ4_0[6144 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.31.attn_output.weightQ4_0[6144 6144]
-
blk.31.attn_q.weightQ4_0[6144 6144]
-
blk.31.attn_k.weightQ4_0[6144 1024]
-
blk.31.attn_v.weightQ4_0[6144 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_gate.weightQ4_0[6144 16384]
-
blk.31.ffn_down.weightQ4_0[16384 6144]
-
blk.31.ffn_up.weightQ4_0[6144 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.32.attn_output.weightQ4_0[6144 6144]
-
blk.32.attn_q.weightQ4_0[6144 6144]
-
blk.32.attn_k.weightQ4_0[6144 1024]
-
blk.32.attn_v.weightQ4_0[6144 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_gate.weightQ4_0[6144 16384]
-
blk.32.ffn_down.weightQ4_0[16384 6144]
-
blk.32.ffn_up.weightQ4_0[6144 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.33.attn_output.weightQ4_0[6144 6144]
-
blk.33.attn_q.weightQ4_0[6144 6144]
-
blk.33.attn_k.weightQ4_0[6144 1024]
-
blk.33.attn_v.weightQ4_0[6144 1024]
-
blk.33.ffn_gate.weightQ4_0[6144 16384]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_down.weightQ4_0[16384 6144]
-
blk.33.ffn_up.weightQ4_0[6144 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.34.attn_output.weightQ4_0[6144 6144]
-
blk.34.attn_q.weightQ4_0[6144 6144]
-
blk.34.attn_k.weightQ4_0[6144 1024]
-
blk.34.attn_v.weightQ4_0[6144 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_gate.weightQ4_0[6144 16384]
-
blk.34.ffn_down.weightQ4_0[16384 6144]
-
blk.34.ffn_up.weightQ4_0[6144 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.35.attn_output.weightQ4_0[6144 6144]
-
blk.35.attn_q.weightQ4_0[6144 6144]
-
blk.35.attn_k.weightQ4_0[6144 1024]
-
blk.35.attn_v.weightQ4_0[6144 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_gate.weightQ4_0[6144 16384]
-
blk.35.ffn_down.weightQ4_0[16384 6144]
-
blk.35.ffn_up.weightQ4_0[6144 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.36.attn_output.weightQ4_0[6144 6144]
-
blk.36.attn_q.weightQ4_0[6144 6144]
-
blk.36.attn_k.weightQ4_0[6144 1024]
-
blk.36.attn_v.weightQ4_0[6144 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_gate.weightQ4_0[6144 16384]
-
blk.36.ffn_down.weightQ4_0[16384 6144]
-
blk.36.ffn_up.weightQ4_0[6144 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.37.attn_output.weightQ4_0[6144 6144]
-
blk.37.attn_q.weightQ4_0[6144 6144]
-
blk.37.attn_k.weightQ4_0[6144 1024]
-
blk.37.attn_v.weightQ4_0[6144 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_gate.weightQ4_0[6144 16384]
-
blk.37.ffn_down.weightQ4_0[16384 6144]
-
blk.37.ffn_up.weightQ4_0[6144 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.38.attn_output.weightQ4_0[6144 6144]
-
blk.38.attn_q.weightQ4_0[6144 6144]
-
blk.38.attn_k.weightQ4_0[6144 1024]
-
blk.38.attn_v.weightQ4_0[6144 1024]
-
blk.38.ffn_gate.weightQ4_0[6144 16384]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_down.weightQ4_0[16384 6144]
-
blk.38.ffn_up.weightQ4_0[6144 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.39.attn_output.weightQ4_0[6144 6144]
-
blk.39.attn_q.weightQ4_0[6144 6144]
-
blk.39.attn_k.weightQ4_0[6144 1024]
-
blk.39.attn_v.weightQ4_0[6144 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_gate.weightQ4_0[6144 16384]
-
blk.39.ffn_down.weightQ4_0[16384 6144]
-
blk.39.ffn_up.weightQ4_0[6144 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.40.attn_output.weightQ4_0[6144 6144]
-
blk.40.attn_q.weightQ4_0[6144 6144]
-
blk.40.attn_k.weightQ4_0[6144 1024]
-
blk.40.attn_v.weightQ4_0[6144 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_gate.weightQ4_0[6144 16384]
-
blk.40.ffn_down.weightQ4_0[16384 6144]
-
blk.40.ffn_up.weightQ4_0[6144 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.41.attn_output.weightQ4_0[6144 6144]
-
blk.41.attn_q.weightQ4_0[6144 6144]
-
blk.41.attn_k.weightQ4_0[6144 1024]
-
blk.41.attn_v.weightQ4_0[6144 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_gate.weightQ4_0[6144 16384]
-
blk.41.ffn_down.weightQ4_0[16384 6144]
-
blk.41.ffn_up.weightQ4_0[6144 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.42.attn_output.weightQ4_0[6144 6144]
-
blk.42.attn_q.weightQ4_0[6144 6144]
-
blk.42.attn_k.weightQ4_0[6144 1024]
-
blk.42.attn_v.weightQ4_0[6144 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_gate.weightQ4_0[6144 16384]
-
blk.42.ffn_down.weightQ4_0[16384 6144]
-
blk.42.ffn_up.weightQ4_0[6144 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.43.attn_output.weightQ4_0[6144 6144]
-
blk.43.attn_q.weightQ4_0[6144 6144]
-
blk.43.attn_k.weightQ4_0[6144 1024]
-
blk.43.attn_v.weightQ4_0[6144 1024]
-
blk.43.ffn_gate.weightQ4_0[6144 16384]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_down.weightQ4_0[16384 6144]
-
blk.43.ffn_up.weightQ4_0[6144 16384]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.44.attn_output.weightQ4_0[6144 6144]
-
blk.44.attn_q.weightQ4_0[6144 6144]
-
blk.44.attn_k.weightQ4_0[6144 1024]
-
blk.44.attn_v.weightQ4_0[6144 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_gate.weightQ4_0[6144 16384]
-
blk.44.ffn_down.weightQ4_0[16384 6144]
-
blk.44.ffn_up.weightQ4_0[6144 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.45.attn_output.weightQ4_0[6144 6144]
-
blk.45.attn_q.weightQ4_0[6144 6144]
-
blk.45.attn_k.weightQ4_0[6144 1024]
-
blk.45.attn_v.weightQ4_0[6144 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_gate.weightQ4_0[6144 16384]
-
blk.45.ffn_down.weightQ4_0[16384 6144]
-
blk.45.ffn_up.weightQ4_0[6144 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.46.attn_output.weightQ4_0[6144 6144]
-
blk.46.attn_q.weightQ4_0[6144 6144]
-
blk.46.attn_k.weightQ4_0[6144 1024]
-
blk.46.attn_v.weightQ4_0[6144 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_gate.weightQ4_0[6144 16384]
-
blk.46.ffn_down.weightQ4_0[16384 6144]
-
blk.46.ffn_up.weightQ4_0[6144 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.47.attn_output.weightQ4_0[6144 6144]
-
blk.47.attn_q.weightQ4_0[6144 6144]
-
blk.47.attn_k.weightQ4_0[6144 1024]
-
blk.47.attn_v.weightQ4_0[6144 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_gate.weightQ4_0[6144 16384]
-
blk.47.ffn_down.weightQ4_0[16384 6144]
-
blk.47.ffn_up.weightQ4_0[6144 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
output_norm.weightF32[6144]
-
output.weightQ6_K[6144 92544]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47