InternLM2.5 has open-sourced a 20 billion parameter base model and a chat model tailored for practical scenarios.
281 Pulls Updated 3 months ago
fc350bfebd20 · 11GB
-
general.architectureinternlm2
-
general.file_type25
-
general.finetune..
-
general.licenseother
-
general.name..
-
general.quantization_version2
-
general.size_label20B
-
general.tags[text-generation]
-
general.typemodel
-
internlm2.attention.head_count48
-
internlm2.attention.head_count_kv8
-
internlm2.attention.layer_norm_rms_epsilon1e-05
-
internlm2.block_count48
-
internlm2.context_length32768
-
internlm2.embedding_length6144
-
internlm2.feed_forward_length16384
-
internlm2.rope.freq_base5e+07
-
quantize.imatrix.chunks_count136
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count336
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id92542
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 20!)[6144, 92544]
-
blk.0.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.0.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.0.attn_v.weightQ5_K[6144, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.0.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.1.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.1.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.1.attn_v.weightQ5_K[6144, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.1.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.2.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.2.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.2.attn_v.weightQ5_K[6144, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.2.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.3.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.3.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.3.attn_v.weightQ5_K[6144, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.3.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.4.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.4.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.4.attn_v.weightQ5_K[6144, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.4.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.5.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.5.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.5.attn_v.weightQ5_K[6144, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.5.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.5.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.6.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.6.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.6.attn_v.weightQ5_K[6144, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.6.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.7.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.7.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.7.attn_v.weightQ5_K[6144, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.7.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.8.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.8.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.8.attn_v.weightQ5_K[6144, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.8.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.9.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.9.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.9.attn_v.weightQ5_K[6144, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.9.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.10.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.10.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.10.attn_v.weightQ5_K[6144, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.10.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.11.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.11.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.11.attn_v.weightQ5_K[6144, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.11.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.12.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.12.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.12.attn_v.weightQ5_K[6144, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.12.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.13.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.13.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.13.attn_v.weightQ5_K[6144, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.13.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.14.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.14.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.14.attn_v.weightQ5_K[6144, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.14.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.15.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.15.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.15.attn_v.weightQ5_K[6144, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.15.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.16.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.16.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.16.attn_v.weightQ5_K[6144, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.16.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.17.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.17.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.17.attn_v.weightQ5_K[6144, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.17.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.18.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.18.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.18.attn_v.weightQ5_K[6144, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.18.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.18.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.19.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.19.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.19.attn_v.weightQ5_K[6144, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.19.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.20.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.20.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.20.attn_v.weightQ5_K[6144, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.20.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.21.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.21.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.21.attn_v.weightQ5_K[6144, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.21.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.22.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.22.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.22.attn_v.weightQ5_K[6144, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.22.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.23.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.23.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.23.attn_v.weightQ5_K[6144, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.23.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.24.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.24.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.24.attn_v.weightQ5_K[6144, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.24.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.25.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.25.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.25.attn_v.weightQ5_K[6144, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.25.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.26.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.26.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.26.attn_v.weightQ5_K[6144, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.26.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.27.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.27.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.27.attn_v.weightQ5_K[6144, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.27.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.28.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.28.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.28.attn_v.weightQ5_K[6144, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.28.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.29.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.29.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.29.attn_v.weightQ5_K[6144, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.29.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.30.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.30.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.30.attn_v.weightQ5_K[6144, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.30.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.31.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.31.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.31.attn_v.weightQ5_K[6144, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.31.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.32.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.32.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.32.attn_v.weightQ5_K[6144, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.32.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.33.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.33.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.33.attn_v.weightQ5_K[6144, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.33.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.34.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.34.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.34.attn_v.weightQ5_K[6144, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.34.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.35.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.35.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.35.attn_v.weightQ5_K[6144, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.35.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.36.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.36.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.36.attn_v.weightQ5_K[6144, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.36.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.37.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.37.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.37.attn_v.weightQ5_K[6144, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.37.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.37.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.38.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.38.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.38.attn_v.weightQ5_K[6144, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.38.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.39.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.39.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.39.attn_v.weightQ5_K[6144, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.39.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.40.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.40.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.40.attn_v.weightQ5_K[6144, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.40.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.41.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.41.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.41.attn_v.weightQ5_K[6144, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.41.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.42.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.42.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.42.attn_v.weightQ5_K[6144, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.42.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.43.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.43.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.43.attn_v.weightQ5_K[6144, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.43.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.43.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.44.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.44.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.44.attn_v.weightQ5_K[6144, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.44.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.45.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.45.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.45.attn_v.weightQ5_K[6144, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.45.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.46.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.46.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.46.attn_v.weightQ5_K[6144, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.46.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
blk.47.attn_k.weight(!unknown_type 20!)[6144, 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.attn_output.weight(!unknown_type 20!)[6144, 6144]
-
blk.47.attn_q.weight(!unknown_type 20!)[6144, 6144]
-
blk.47.attn_v.weightQ5_K[6144, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[16384, 6144]
-
blk.47.ffn_gate.weight(!unknown_type 20!)[6144, 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.ffn_up.weight(!unknown_type 20!)[6144, 16384]
-
output.weightQ6_K[6144, 92544]
-
output_norm.weightF32[6144]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47