InternLM2.5 has open-sourced a 20 billion parameter base model and a chat model tailored for practical scenarios.
281 Pulls Updated 3 months ago
54bac32fc612 · 8.8GB
-
general.architectureinternlm2
-
general.file_type26
-
general.finetune..
-
general.licenseother
-
general.name..
-
general.quantization_version2
-
general.size_label20B
-
general.tags[text-generation]
-
general.typemodel
-
internlm2.attention.head_count48
-
internlm2.attention.head_count_kv8
-
internlm2.attention.layer_norm_rms_epsilon1e-05
-
internlm2.block_count48
-
internlm2.context_length32768
-
internlm2.embedding_length6144
-
internlm2.feed_forward_length16384
-
internlm2.rope.freq_base5e+07
-
quantize.imatrix.chunks_count136
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count336
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id92542
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[6144, 92544]
-
blk.0.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.0.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.0.attn_v.weightQ4_K[6144, 1024]
-
blk.0.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.1.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.1.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.1.attn_v.weightQ4_K[6144, 1024]
-
blk.1.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.2.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.2.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.2.attn_v.weightQ4_K[6144, 1024]
-
blk.2.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.3.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.3.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.3.attn_v.weightQ4_K[6144, 1024]
-
blk.3.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.4.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.4.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.4.attn_v.weightQ4_K[6144, 1024]
-
blk.4.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.5.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.5.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.5.attn_v.weightQ4_K[6144, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.5.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.6.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.6.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.6.attn_v.weightQ4_K[6144, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.7.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.7.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.7.attn_v.weightQ4_K[6144, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.8.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.8.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.8.attn_v.weightQ4_K[6144, 1024]
-
blk.8.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.9.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.9.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.9.attn_v.weightQ4_K[6144, 1024]
-
blk.9.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.10.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.10.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.10.attn_v.weightQ4_K[6144, 1024]
-
blk.10.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.11.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.11.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.11.attn_v.weightQ4_K[6144, 1024]
-
blk.11.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.12.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.12.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.12.attn_v.weightQ4_K[6144, 1024]
-
blk.12.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.13.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.13.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.13.attn_v.weightQ4_K[6144, 1024]
-
blk.13.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.14.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.14.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.14.attn_v.weightQ4_K[6144, 1024]
-
blk.14.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.14.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.15.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.15.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.15.attn_v.weightQ4_K[6144, 1024]
-
blk.15.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.15.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.16.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.16.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.16.attn_v.weightQ4_K[6144, 1024]
-
blk.16.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.16.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.17.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.17.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.17.attn_v.weightQ4_K[6144, 1024]
-
blk.17.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.17.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.18.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.18.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.18.attn_v.weightQ4_K[6144, 1024]
-
blk.18.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.18.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.18.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.19.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.19.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.19.attn_v.weightQ4_K[6144, 1024]
-
blk.19.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.19.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.20.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.20.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.20.attn_v.weightQ4_K[6144, 1024]
-
blk.20.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.20.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.21.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.21.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.21.attn_v.weightQ4_K[6144, 1024]
-
blk.21.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.21.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.22.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.22.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.22.attn_v.weightQ4_K[6144, 1024]
-
blk.22.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.22.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.23.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.23.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.23.attn_v.weightQ4_K[6144, 1024]
-
blk.23.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.23.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.24.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.24.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.24.attn_v.weightQ4_K[6144, 1024]
-
blk.24.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.24.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.25.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.25.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.25.attn_v.weightQ4_K[6144, 1024]
-
blk.25.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.25.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.26.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.26.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.26.attn_v.weightQ4_K[6144, 1024]
-
blk.26.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.26.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.27.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.27.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.27.attn_v.weightQ4_K[6144, 1024]
-
blk.27.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.27.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.28.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.28.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.28.attn_v.weightQ4_K[6144, 1024]
-
blk.28.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.28.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.29.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.29.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.29.attn_v.weightQ4_K[6144, 1024]
-
blk.29.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.29.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.30.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.30.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.30.attn_v.weightQ4_K[6144, 1024]
-
blk.30.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.30.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.31.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.31.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.31.attn_v.weightQ4_K[6144, 1024]
-
blk.31.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.31.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.32.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.32.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.32.attn_v.weightQ4_K[6144, 1024]
-
blk.32.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.32.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.33.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.33.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.33.attn_v.weightQ4_K[6144, 1024]
-
blk.33.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.33.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.34.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.34.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.34.attn_v.weightQ4_K[6144, 1024]
-
blk.34.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.34.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.35.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.35.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.35.attn_v.weightQ4_K[6144, 1024]
-
blk.35.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.36.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.36.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.36.attn_v.weightQ4_K[6144, 1024]
-
blk.36.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.37.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.37.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.37.attn_v.weightQ4_K[6144, 1024]
-
blk.37.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.37.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.38.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.38.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.38.attn_v.weightQ4_K[6144, 1024]
-
blk.38.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.39.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.39.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.39.attn_v.weightQ4_K[6144, 1024]
-
blk.39.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.40.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.40.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.40.attn_v.weightQ4_K[6144, 1024]
-
blk.40.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.40.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.41.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.41.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.41.attn_v.weightQ4_K[6144, 1024]
-
blk.41.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.41.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.42.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.42.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.42.attn_v.weightQ4_K[6144, 1024]
-
blk.42.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.42.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.43.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.43.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.43.attn_v.weightQ4_K[6144, 1024]
-
blk.43.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.43.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.43.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.44.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.44.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.44.attn_v.weightQ4_K[6144, 1024]
-
blk.44.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.44.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.45.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.45.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.45.attn_v.weightQ4_K[6144, 1024]
-
blk.45.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.45.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.46.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.46.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.46.attn_v.weightQ4_K[6144, 1024]
-
blk.46.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.46.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
blk.47.attn_k.weight(!unknown_type 21!)[6144, 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.47.attn_q.weight(!unknown_type 21!)[6144, 6144]
-
blk.47.attn_v.weightQ4_K[6144, 1024]
-
blk.47.ffn_down.weight(!unknown_type 21!)[16384, 6144]
-
blk.47.ffn_gate.weight(!unknown_type 21!)[6144, 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.ffn_up.weight(!unknown_type 21!)[6144, 16384]
-
output.weightQ6_K[6144, 92544]
-
output_norm.weightF32[6144]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47