I-quants for qwen2.5-32b-instruct
Tools
32B
1 Pull Updated 2 hours ago
48f89b4e11bb · 9.0GB
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count448
-
quantize.imatrix.file/models_out/Qwen2.5-32B-Instruct-GGUF/Qwen2.5-32B-Instruct.imatrix
-
general.architectureqwen2
-
general.file_typeIQ2_XXS
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count64
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length27648
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ2_K[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ2_K[27648 5120]
-
blk.0.ffn_gate.weightI8[5120 27648]
-
blk.0.ffn_up.weightI8[5120 27648]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightI8[5120 1024]
-
blk.0.attn_output.weightI8[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightI8[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ2_K[27648 5120]
-
blk.1.ffn_gate.weightI8[5120 27648]
-
blk.1.ffn_up.weightI8[5120 27648]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightI8[5120 1024]
-
blk.1.attn_output.weightI8[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightI8[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_up.weightI8[5120 27648]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightI8[5120 1024]
-
blk.2.attn_output.weightI8[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightI8[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[5120 1024]
-
blk.2.ffn_down.weightQ2_K[27648 5120]
-
blk.2.ffn_gate.weightI8[5120 27648]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ2_K[27648 5120]
-
blk.3.ffn_gate.weightI8[5120 27648]
-
blk.3.ffn_up.weightI8[5120 27648]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightI8[5120 1024]
-
blk.3.attn_output.weightI8[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightI8[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ2_K[27648 5120]
-
blk.4.ffn_gate.weightI8[5120 27648]
-
blk.4.ffn_up.weightI8[5120 27648]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightI8[5120 1024]
-
blk.4.attn_output.weightI8[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightI8[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ2_K[27648 5120]
-
blk.5.ffn_gate.weightI8[5120 27648]
-
blk.5.ffn_up.weightI8[5120 27648]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightI8[5120 1024]
-
blk.5.attn_output.weightI8[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightI8[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_up.weightI8[5120 27648]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightI8[5120 1024]
-
blk.6.attn_output.weightI8[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightI8[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[5120 1024]
-
blk.6.ffn_down.weightQ2_K[27648 5120]
-
blk.6.ffn_gate.weightI8[5120 27648]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ2_K[27648 5120]
-
blk.7.ffn_gate.weightI8[5120 27648]
-
blk.7.ffn_up.weightI8[5120 27648]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightI8[5120 1024]
-
blk.7.attn_output.weightI8[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightI8[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightI8[27648 5120]
-
blk.8.ffn_gate.weightI8[5120 27648]
-
blk.8.ffn_up.weightI8[5120 27648]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightI8[5120 1024]
-
blk.8.attn_output.weightI8[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightI8[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightI8[27648 5120]
-
blk.9.ffn_gate.weightI8[5120 27648]
-
blk.9.ffn_up.weightI8[5120 27648]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightI8[5120 1024]
-
blk.9.attn_output.weightI8[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightI8[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_up.weightI8[5120 27648]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightI8[5120 1024]
-
blk.10.attn_output.weightI8[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightI8[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[5120 1024]
-
blk.10.ffn_down.weightI8[27648 5120]
-
blk.10.ffn_gate.weightI8[5120 27648]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightI8[27648 5120]
-
blk.11.ffn_gate.weightI8[5120 27648]
-
blk.11.ffn_up.weightI8[5120 27648]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightI8[5120 1024]
-
blk.11.attn_output.weightI8[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightI8[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightI8[27648 5120]
-
blk.12.ffn_gate.weightI8[5120 27648]
-
blk.12.ffn_up.weightI8[5120 27648]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightI8[5120 1024]
-
blk.12.attn_output.weightI8[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightI8[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightI8[27648 5120]
-
blk.13.ffn_gate.weightI8[5120 27648]
-
blk.13.ffn_up.weightI8[5120 27648]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightI8[5120 1024]
-
blk.13.attn_output.weightI8[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightI8[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_up.weightI8[5120 27648]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightI8[5120 1024]
-
blk.14.attn_output.weightI8[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightI8[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[5120 1024]
-
blk.14.ffn_down.weightI8[27648 5120]
-
blk.14.ffn_gate.weightI8[5120 27648]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightI8[27648 5120]
-
blk.15.ffn_gate.weightI8[5120 27648]
-
blk.15.ffn_up.weightI8[5120 27648]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightI8[5120 1024]
-
blk.15.attn_output.weightI8[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightI8[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightI8[27648 5120]
-
blk.16.ffn_gate.weightI8[5120 27648]
-
blk.16.ffn_up.weightI8[5120 27648]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightI8[5120 1024]
-
blk.16.attn_output.weightI8[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightI8[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightI8[27648 5120]
-
blk.17.ffn_gate.weightI8[5120 27648]
-
blk.17.ffn_up.weightI8[5120 27648]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightI8[5120 1024]
-
blk.17.attn_output.weightI8[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightI8[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_up.weightI8[5120 27648]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightI8[5120 1024]
-
blk.18.attn_output.weightI8[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightI8[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[5120 1024]
-
blk.18.ffn_down.weightI8[27648 5120]
-
blk.18.ffn_gate.weightI8[5120 27648]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightI8[27648 5120]
-
blk.19.ffn_gate.weightI8[5120 27648]
-
blk.19.ffn_up.weightI8[5120 27648]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightI8[5120 1024]
-
blk.19.attn_output.weightI8[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightI8[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightI8[27648 5120]
-
blk.20.ffn_gate.weightI8[5120 27648]
-
blk.20.ffn_up.weightI8[5120 27648]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightI8[5120 1024]
-
blk.20.attn_output.weightI8[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightI8[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightI8[27648 5120]
-
blk.21.ffn_gate.weightI8[5120 27648]
-
blk.21.ffn_up.weightI8[5120 27648]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightI8[5120 1024]
-
blk.21.attn_output.weightI8[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightI8[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_up.weightI8[5120 27648]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightI8[5120 1024]
-
blk.22.attn_output.weightI8[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightI8[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[5120 1024]
-
blk.22.ffn_down.weightI8[27648 5120]
-
blk.22.ffn_gate.weightI8[5120 27648]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightI8[27648 5120]
-
blk.23.ffn_gate.weightI8[5120 27648]
-
blk.23.ffn_up.weightI8[5120 27648]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightI8[5120 1024]
-
blk.23.attn_output.weightI8[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightI8[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightI8[27648 5120]
-
blk.24.ffn_gate.weightI8[5120 27648]
-
blk.24.ffn_up.weightI8[5120 27648]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightI8[5120 1024]
-
blk.24.attn_output.weightI8[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightI8[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[5120 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightI8[27648 5120]
-
blk.25.ffn_gate.weightI8[5120 27648]
-
blk.25.ffn_up.weightI8[5120 27648]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightI8[5120 1024]
-
blk.25.attn_output.weightI8[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightI8[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_up.weightI8[5120 27648]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightI8[5120 1024]
-
blk.26.attn_output.weightI8[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightI8[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[5120 1024]
-
blk.26.ffn_down.weightI8[27648 5120]
-
blk.26.ffn_gate.weightI8[5120 27648]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightI8[27648 5120]
-
blk.27.ffn_gate.weightI8[5120 27648]
-
blk.27.ffn_up.weightI8[5120 27648]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightI8[5120 1024]
-
blk.27.attn_output.weightI8[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightI8[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightI8[27648 5120]
-
blk.28.ffn_gate.weightI8[5120 27648]
-
blk.28.ffn_up.weightI8[5120 27648]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightI8[5120 1024]
-
blk.28.attn_output.weightI8[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightI8[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightI8[27648 5120]
-
blk.29.ffn_gate.weightI8[5120 27648]
-
blk.29.ffn_up.weightI8[5120 27648]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightI8[5120 1024]
-
blk.29.attn_output.weightI8[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightI8[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_up.weightI8[5120 27648]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightI8[5120 1024]
-
blk.30.attn_output.weightI8[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightI8[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[5120 1024]
-
blk.30.ffn_down.weightI8[27648 5120]
-
blk.30.ffn_gate.weightI8[5120 27648]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightI8[27648 5120]
-
blk.31.ffn_gate.weightI8[5120 27648]
-
blk.31.ffn_up.weightI8[5120 27648]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightI8[5120 1024]
-
blk.31.attn_output.weightI8[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightI8[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightI8[27648 5120]
-
blk.32.ffn_gate.weightI8[5120 27648]
-
blk.32.ffn_up.weightI8[5120 27648]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightI8[5120 1024]
-
blk.32.attn_output.weightI8[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightI8[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightI8[27648 5120]
-
blk.33.ffn_gate.weightI8[5120 27648]
-
blk.33.ffn_up.weightI8[5120 27648]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightI8[5120 1024]
-
blk.33.attn_output.weightI8[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightI8[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[5120 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_up.weightI8[5120 27648]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightI8[5120 1024]
-
blk.34.attn_output.weightI8[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightI8[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[5120 1024]
-
blk.34.ffn_down.weightI8[27648 5120]
-
blk.34.ffn_gate.weightI8[5120 27648]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightI8[27648 5120]
-
blk.35.ffn_gate.weightI8[5120 27648]
-
blk.35.ffn_up.weightI8[5120 27648]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightI8[5120 1024]
-
blk.35.attn_output.weightI8[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightI8[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightI8[27648 5120]
-
blk.36.ffn_gate.weightI8[5120 27648]
-
blk.36.ffn_up.weightI8[5120 27648]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightI8[5120 1024]
-
blk.36.attn_output.weightI8[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightI8[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightI8[27648 5120]
-
blk.37.ffn_gate.weightI8[5120 27648]
-
blk.37.ffn_up.weightI8[5120 27648]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightI8[5120 1024]
-
blk.37.attn_output.weightI8[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightI8[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_up.weightI8[5120 27648]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightI8[5120 1024]
-
blk.38.attn_output.weightI8[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightI8[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[5120 1024]
-
blk.38.ffn_down.weightI8[27648 5120]
-
blk.38.ffn_gate.weightI8[5120 27648]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightI8[27648 5120]
-
blk.39.ffn_gate.weightI8[5120 27648]
-
blk.39.ffn_up.weightI8[5120 27648]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightI8[5120 1024]
-
blk.39.attn_output.weightI8[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightI8[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightI8[27648 5120]
-
blk.40.ffn_gate.weightI8[5120 27648]
-
blk.40.ffn_up.weightI8[5120 27648]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightI8[5120 1024]
-
blk.40.attn_output.weightI8[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightI8[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[5120 1024]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightI8[27648 5120]
-
blk.41.ffn_gate.weightI8[5120 27648]
-
blk.41.ffn_up.weightI8[5120 27648]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightI8[5120 1024]
-
blk.41.attn_output.weightI8[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightI8[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_up.weightI8[5120 27648]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightI8[5120 1024]
-
blk.42.attn_output.weightI8[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightI8[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[5120 1024]
-
blk.42.ffn_down.weightI8[27648 5120]
-
blk.42.ffn_gate.weightI8[5120 27648]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightI8[27648 5120]
-
blk.43.ffn_gate.weightI8[5120 27648]
-
blk.43.ffn_up.weightI8[5120 27648]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightI8[5120 1024]
-
blk.43.attn_output.weightI8[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightI8[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[5120 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightI8[27648 5120]
-
blk.44.ffn_gate.weightI8[5120 27648]
-
blk.44.ffn_up.weightI8[5120 27648]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightI8[5120 1024]
-
blk.44.attn_output.weightI8[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightI8[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[5120 1024]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightI8[27648 5120]
-
blk.45.ffn_gate.weightI8[5120 27648]
-
blk.45.ffn_up.weightI8[5120 27648]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightI8[5120 1024]
-
blk.45.attn_output.weightI8[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightI8[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_up.weightI8[5120 27648]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightI8[5120 1024]
-
blk.46.attn_output.weightI8[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightI8[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[5120 1024]
-
blk.46.ffn_down.weightI8[27648 5120]
-
blk.46.ffn_gate.weightI8[5120 27648]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightI8[27648 5120]
-
blk.47.ffn_gate.weightI8[5120 27648]
-
blk.47.ffn_up.weightI8[5120 27648]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightI8[5120 1024]
-
blk.47.attn_output.weightI8[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightI8[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[5120 1024]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.ffn_down.weightI8[27648 5120]
-
blk.48.ffn_gate.weightI8[5120 27648]
-
blk.48.ffn_up.weightI8[5120 27648]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightI8[5120 1024]
-
blk.48.attn_output.weightI8[5120 5120]
-
blk.48.attn_q.biasF32[5120]
-
blk.48.attn_q.weightI8[5120 5120]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_K[5120 1024]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.ffn_down.weightI8[27648 5120]
-
blk.49.ffn_gate.weightI8[5120 27648]
-
blk.49.ffn_up.weightI8[5120 27648]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightI8[5120 1024]
-
blk.49.attn_output.weightI8[5120 5120]
-
blk.49.attn_q.biasF32[5120]
-
blk.49.attn_q.weightI8[5120 5120]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_K[5120 1024]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.ffn_up.weightI8[5120 27648]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightI8[5120 1024]
-
blk.50.attn_output.weightI8[5120 5120]
-
blk.50.attn_q.biasF32[5120]
-
blk.50.attn_q.weightI8[5120 5120]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_K[5120 1024]
-
blk.50.ffn_down.weightI8[27648 5120]
-
blk.50.ffn_gate.weightI8[5120 27648]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.ffn_down.weightI8[27648 5120]
-
blk.51.ffn_gate.weightI8[5120 27648]
-
blk.51.ffn_up.weightI8[5120 27648]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightI8[5120 1024]
-
blk.51.attn_output.weightI8[5120 5120]
-
blk.51.attn_q.biasF32[5120]
-
blk.51.attn_q.weightI8[5120 5120]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_K[5120 1024]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.ffn_down.weightI8[27648 5120]
-
blk.52.ffn_gate.weightI8[5120 27648]
-
blk.52.ffn_up.weightI8[5120 27648]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightI8[5120 1024]
-
blk.52.attn_output.weightI8[5120 5120]
-
blk.52.attn_q.biasF32[5120]
-
blk.52.attn_q.weightI8[5120 5120]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_K[5120 1024]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.ffn_down.weightI8[27648 5120]
-
blk.53.ffn_gate.weightI8[5120 27648]
-
blk.53.ffn_up.weightI8[5120 27648]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightI8[5120 1024]
-
blk.53.attn_output.weightI8[5120 5120]
-
blk.53.attn_q.biasF32[5120]
-
blk.53.attn_q.weightI8[5120 5120]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_K[5120 1024]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.ffn_up.weightI8[5120 27648]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightI8[5120 1024]
-
blk.54.attn_output.weightI8[5120 5120]
-
blk.54.attn_q.biasF32[5120]
-
blk.54.attn_q.weightI8[5120 5120]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_K[5120 1024]
-
blk.54.ffn_down.weightI8[27648 5120]
-
blk.54.ffn_gate.weightI8[5120 27648]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.ffn_down.weightI8[27648 5120]
-
blk.55.ffn_gate.weightI8[5120 27648]
-
blk.55.ffn_up.weightI8[5120 27648]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightI8[5120 1024]
-
blk.55.attn_output.weightI8[5120 5120]
-
blk.55.attn_q.biasF32[5120]
-
blk.55.attn_q.weightI8[5120 5120]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_K[5120 1024]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.ffn_down.weightI8[27648 5120]
-
blk.56.ffn_gate.weightI8[5120 27648]
-
blk.56.ffn_up.weightI8[5120 27648]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightI8[5120 1024]
-
blk.56.attn_output.weightI8[5120 5120]
-
blk.56.attn_q.biasF32[5120]
-
blk.56.attn_q.weightI8[5120 5120]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_K[5120 1024]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.ffn_down.weightI8[27648 5120]
-
blk.57.ffn_gate.weightI8[5120 27648]
-
blk.57.ffn_up.weightI8[5120 27648]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightI8[5120 1024]
-
blk.57.attn_output.weightI8[5120 5120]
-
blk.57.attn_q.biasF32[5120]
-
blk.57.attn_q.weightI8[5120 5120]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_K[5120 1024]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.ffn_up.weightI8[5120 27648]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightI8[5120 1024]
-
blk.58.attn_output.weightI8[5120 5120]
-
blk.58.attn_q.biasF32[5120]
-
blk.58.attn_q.weightI8[5120 5120]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_K[5120 1024]
-
blk.58.ffn_down.weightI8[27648 5120]
-
blk.58.ffn_gate.weightI8[5120 27648]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.ffn_down.weightI8[27648 5120]
-
blk.59.ffn_gate.weightI8[5120 27648]
-
blk.59.ffn_up.weightI8[5120 27648]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightI8[5120 1024]
-
blk.59.attn_output.weightI8[5120 5120]
-
blk.59.attn_q.biasF32[5120]
-
blk.59.attn_q.weightI8[5120 5120]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_K[5120 1024]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.ffn_down.weightI8[27648 5120]
-
blk.60.ffn_gate.weightI8[5120 27648]
-
blk.60.ffn_up.weightI8[5120 27648]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightI8[5120 1024]
-
blk.60.attn_output.weightI8[5120 5120]
-
blk.60.attn_q.biasF32[5120]
-
blk.60.attn_q.weightI8[5120 5120]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_K[5120 1024]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.ffn_down.weightI8[27648 5120]
-
blk.61.ffn_gate.weightI8[5120 27648]
-
blk.61.ffn_up.weightI8[5120 27648]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightI8[5120 1024]
-
blk.61.attn_output.weightI8[5120 5120]
-
blk.61.attn_q.biasF32[5120]
-
blk.61.attn_q.weightI8[5120 5120]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_K[5120 1024]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.ffn_up.weightI8[5120 27648]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightI8[5120 1024]
-
blk.62.attn_output.weightI8[5120 5120]
-
blk.62.attn_q.biasF32[5120]
-
blk.62.attn_q.weightI8[5120 5120]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_K[5120 1024]
-
blk.62.ffn_down.weightI8[27648 5120]
-
blk.62.ffn_gate.weightI8[5120 27648]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.ffn_down.weightI8[27648 5120]
-
blk.63.ffn_gate.weightI8[5120 27648]
-
blk.63.ffn_up.weightI8[5120 27648]
-
blk.63.ffn_norm.weightF32[5120]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightI8[5120 1024]
-
blk.63.attn_output.weightI8[5120 5120]
-
blk.63.attn_q.biasF32[5120]
-
blk.63.attn_q.weightI8[5120 5120]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_K[5120 1024]
-
output.weightQ5_K[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63