I-quants for qwen2.5-32b-instruct
tools
103 Pulls Updated 6 weeks ago
4f5c9155a41e · 11GB
-
general.architectureqwen2
-
general.base_model.0.nameQwen2.5 32B
-
general.base_model.0.organizationQwen
-
general.base_model.0.repo_urlhttps://huggingface.co/Qwen/Qwen2.5-32B
-
general.base_model.count1
-
general.basenameQwen2.5
-
general.file_type29
-
general.finetuneInstruct
-
general.languages[en]
-
general.licenseapache-2.0
-
general.license.linkhttps://huggingface.co/Qwen/Qwen2.5-32B-Instruct/blob/main/LICENSE
-
general.nameQwen2.5 32B Instruct
-
general.quantization_version2
-
general.size_label32B
-
general.tags[chat, text-generation]
-
general.typemodel
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/home/tyra/storage/quants/misc/calibration_datav3.txt
-
quantize.imatrix.entries_count448
-
quantize.imatrix.filegguf/Qwen2.5-32B-Instruct/imatrix.dat
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count64
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length27648
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120, 152064]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[5120, 1024]
-
blk.0.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.0.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[5120, 1024]
-
blk.1.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.1.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[5120, 1024]
-
blk.2.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.2.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[5120, 1024]
-
blk.3.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.3.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[5120, 1024]
-
blk.4.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.4.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[5120, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.5.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[5120, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.6.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[5120, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[27648, 5120]
-
blk.7.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[5120, 1024]
-
blk.8.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.8.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[5120, 1024]
-
blk.9.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.9.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[5120, 1024]
-
blk.10.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.10.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[5120, 1024]
-
blk.11.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.11.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[5120, 1024]
-
blk.12.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.12.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[5120, 1024]
-
blk.13.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.13.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[5120, 1024]
-
blk.14.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.14.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[5120, 1024]
-
blk.15.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.15.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[5120, 1024]
-
blk.16.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.16.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[5120, 1024]
-
blk.17.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.17.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[5120, 1024]
-
blk.18.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.18.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[5120, 1024]
-
blk.19.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.19.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[5120, 1024]
-
blk.20.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.20.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[5120, 1024]
-
blk.21.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.21.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[5120, 1024]
-
blk.22.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.22.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[5120, 1024]
-
blk.23.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.23.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[5120, 1024]
-
blk.24.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.24.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[5120, 1024]
-
blk.25.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.25.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[5120, 1024]
-
blk.26.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.26.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[5120, 1024]
-
blk.27.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.27.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[5120, 1024]
-
blk.28.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.28.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[5120, 1024]
-
blk.29.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.29.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[5120, 1024]
-
blk.30.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.30.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[5120, 1024]
-
blk.31.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.31.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[5120, 1024]
-
blk.32.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.32.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[5120, 1024]
-
blk.33.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.33.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[5120, 1024]
-
blk.34.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.34.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[5120, 1024]
-
blk.35.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.35.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[5120, 1024]
-
blk.36.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.36.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[5120, 1024]
-
blk.37.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.37.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[5120, 1024]
-
blk.38.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.38.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[5120, 1024]
-
blk.39.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.39.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[5120, 1024]
-
blk.40.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.40.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[5120, 1024]
-
blk.41.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.41.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[5120, 1024]
-
blk.42.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.42.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[5120, 1024]
-
blk.43.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.43.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[5120, 1024]
-
blk.44.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.44.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[5120, 1024]
-
blk.45.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.45.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[5120, 1024]
-
blk.46.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.46.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[5120, 1024]
-
blk.47.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.47.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.48.attn_q.biasF32[5120]
-
blk.48.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_K[5120, 1024]
-
blk.48.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.48.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.48.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.49.attn_q.biasF32[5120]
-
blk.49.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_K[5120, 1024]
-
blk.49.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.49.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.50.attn_q.biasF32[5120]
-
blk.50.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_K[5120, 1024]
-
blk.50.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.50.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.50.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.51.attn_q.biasF32[5120]
-
blk.51.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_K[5120, 1024]
-
blk.51.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.51.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.52.attn_q.biasF32[5120]
-
blk.52.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_K[5120, 1024]
-
blk.52.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.52.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.52.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.53.attn_q.biasF32[5120]
-
blk.53.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_K[5120, 1024]
-
blk.53.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.53.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.53.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.54.attn_q.biasF32[5120]
-
blk.54.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_K[5120, 1024]
-
blk.54.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.54.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.54.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.55.attn_q.biasF32[5120]
-
blk.55.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_K[5120, 1024]
-
blk.55.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.55.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.56.attn_q.biasF32[5120]
-
blk.56.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_K[5120, 1024]
-
blk.56.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.56.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.56.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.57.attn_q.biasF32[5120]
-
blk.57.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_K[5120, 1024]
-
blk.57.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.57.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.57.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.58.attn_q.biasF32[5120]
-
blk.58.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_K[5120, 1024]
-
blk.58.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.58.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.58.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.59.attn_q.biasF32[5120]
-
blk.59.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_K[5120, 1024]
-
blk.59.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.59.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.60.attn_q.biasF32[5120]
-
blk.60.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_K[5120, 1024]
-
blk.60.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.60.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.60.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.61.attn_q.biasF32[5120]
-
blk.61.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_K[5120, 1024]
-
blk.61.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.61.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.62.attn_q.biasF32[5120]
-
blk.62.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_K[5120, 1024]
-
blk.62.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.62.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.62.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weight(!unknown_type 22!)[5120, 1024]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.63.attn_q.biasF32[5120]
-
blk.63.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_K[5120, 1024]
-
blk.63.ffn_down.weight(!unknown_type 22!)[27648, 5120]
-
blk.63.ffn_gate.weight(!unknown_type 22!)[5120, 27648]
-
blk.63.ffn_norm.weightF32[5120]
-
blk.63.ffn_up.weight(!unknown_type 22!)[5120, 27648]
-
output.weightQ5_K[5120, 152064]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63