latest
24GB
Tools
32B
15 Pulls Updated 2 weeks ago
87eabadf5b40 · 24GB
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count448
-
quantize.imatrix.file/models_out/Replete-LLM-V2.5-Qwen-32b-GGUF/Replete-LLM-V2.5-Qwen-32b.imatrix
-
general.architectureqwen2
-
general.file_typeQ5_K_M
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count64
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length27648
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ8_0[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ6_K[27648 5120]
-
blk.0.ffn_gate.weightQ5_K[5120 27648]
-
blk.0.ffn_up.weightQ5_K[5120 27648]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightQ5_K[5120 1024]
-
blk.0.attn_output.weightQ5_K[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightQ5_K[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ6_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ6_K[27648 5120]
-
blk.1.ffn_gate.weightQ5_K[5120 27648]
-
blk.1.ffn_up.weightQ5_K[5120 27648]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightQ5_K[5120 1024]
-
blk.1.attn_output.weightQ5_K[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightQ5_K[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ6_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ5_K[27648 5120]
-
blk.2.ffn_gate.weightQ5_K[5120 27648]
-
blk.2.ffn_up.weightQ5_K[5120 27648]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightQ5_K[5120 1024]
-
blk.2.attn_output.weightQ5_K[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightQ5_K[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ5_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ5_K[27648 5120]
-
blk.3.ffn_gate.weightQ5_K[5120 27648]
-
blk.3.ffn_up.weightQ5_K[5120 27648]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightQ5_K[5120 1024]
-
blk.3.attn_output.weightQ5_K[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightQ5_K[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ5_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ6_K[27648 5120]
-
blk.4.ffn_gate.weightQ5_K[5120 27648]
-
blk.4.ffn_up.weightQ5_K[5120 27648]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightQ5_K[5120 1024]
-
blk.4.attn_output.weightQ5_K[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightQ5_K[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ6_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ5_K[27648 5120]
-
blk.5.ffn_gate.weightQ5_K[5120 27648]
-
blk.5.ffn_up.weightQ5_K[5120 27648]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightQ5_K[5120 1024]
-
blk.5.attn_output.weightQ5_K[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightQ5_K[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ5_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ6_K[27648 5120]
-
blk.6.ffn_gate.weightQ5_K[5120 27648]
-
blk.6.ffn_up.weightQ5_K[5120 27648]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightQ5_K[5120 1024]
-
blk.6.attn_output.weightQ5_K[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightQ5_K[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ6_K[5120 1024]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ6_K[27648 5120]
-
blk.7.ffn_gate.weightQ5_K[5120 27648]
-
blk.7.ffn_up.weightQ5_K[5120 27648]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightQ5_K[5120 1024]
-
blk.7.attn_output.weightQ5_K[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightQ5_K[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ6_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ6_K[27648 5120]
-
blk.8.ffn_gate.weightQ5_K[5120 27648]
-
blk.8.ffn_up.weightQ5_K[5120 27648]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightQ5_K[5120 1024]
-
blk.8.attn_output.weightQ5_K[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightQ5_K[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ6_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ6_K[27648 5120]
-
blk.9.ffn_gate.weightQ5_K[5120 27648]
-
blk.9.ffn_up.weightQ5_K[5120 27648]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightQ5_K[5120 1024]
-
blk.9.attn_output.weightQ5_K[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightQ5_K[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ6_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ6_K[27648 5120]
-
blk.10.ffn_gate.weightQ5_K[5120 27648]
-
blk.10.ffn_up.weightQ5_K[5120 27648]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightQ5_K[5120 1024]
-
blk.10.attn_output.weightQ5_K[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightQ5_K[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ6_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ6_K[27648 5120]
-
blk.11.ffn_gate.weightQ5_K[5120 27648]
-
blk.11.ffn_up.weightQ5_K[5120 27648]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightQ5_K[5120 1024]
-
blk.11.attn_output.weightQ5_K[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightQ5_K[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ6_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ6_K[27648 5120]
-
blk.12.ffn_gate.weightQ5_K[5120 27648]
-
blk.12.ffn_up.weightQ5_K[5120 27648]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightQ5_K[5120 1024]
-
blk.12.attn_output.weightQ5_K[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightQ5_K[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ6_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ6_K[27648 5120]
-
blk.13.ffn_gate.weightQ5_K[5120 27648]
-
blk.13.ffn_up.weightQ5_K[5120 27648]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightQ5_K[5120 1024]
-
blk.13.attn_output.weightQ5_K[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightQ5_K[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ6_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ6_K[27648 5120]
-
blk.14.ffn_gate.weightQ5_K[5120 27648]
-
blk.14.ffn_up.weightQ5_K[5120 27648]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightQ5_K[5120 1024]
-
blk.14.attn_output.weightQ5_K[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightQ5_K[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ6_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ6_K[27648 5120]
-
blk.15.ffn_gate.weightQ5_K[5120 27648]
-
blk.15.ffn_up.weightQ5_K[5120 27648]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightQ5_K[5120 1024]
-
blk.15.attn_output.weightQ5_K[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightQ5_K[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ6_K[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ5_K[27648 5120]
-
blk.16.ffn_gate.weightQ5_K[5120 27648]
-
blk.16.ffn_up.weightQ5_K[5120 27648]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightQ5_K[5120 1024]
-
blk.16.attn_output.weightQ5_K[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightQ5_K[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ5_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ5_K[27648 5120]
-
blk.17.ffn_gate.weightQ5_K[5120 27648]
-
blk.17.ffn_up.weightQ5_K[5120 27648]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightQ5_K[5120 1024]
-
blk.17.attn_output.weightQ5_K[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightQ5_K[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ5_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ6_K[27648 5120]
-
blk.18.ffn_gate.weightQ5_K[5120 27648]
-
blk.18.ffn_up.weightQ5_K[5120 27648]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightQ5_K[5120 1024]
-
blk.18.attn_output.weightQ5_K[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightQ5_K[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ6_K[5120 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ5_K[27648 5120]
-
blk.19.ffn_gate.weightQ5_K[5120 27648]
-
blk.19.ffn_up.weightQ5_K[5120 27648]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightQ5_K[5120 1024]
-
blk.19.attn_output.weightQ5_K[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightQ5_K[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ5_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ6_K[27648 5120]
-
blk.20.ffn_gate.weightQ5_K[5120 27648]
-
blk.20.ffn_up.weightQ5_K[5120 27648]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightQ5_K[5120 1024]
-
blk.20.attn_output.weightQ5_K[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightQ5_K[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ6_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ5_K[27648 5120]
-
blk.21.ffn_gate.weightQ5_K[5120 27648]
-
blk.21.ffn_up.weightQ5_K[5120 27648]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightQ5_K[5120 1024]
-
blk.21.attn_output.weightQ5_K[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightQ5_K[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ5_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ5_K[27648 5120]
-
blk.22.ffn_gate.weightQ5_K[5120 27648]
-
blk.22.ffn_up.weightQ5_K[5120 27648]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightQ5_K[5120 1024]
-
blk.22.attn_output.weightQ5_K[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightQ5_K[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ5_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ6_K[27648 5120]
-
blk.23.ffn_gate.weightQ5_K[5120 27648]
-
blk.23.ffn_up.weightQ5_K[5120 27648]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightQ5_K[5120 1024]
-
blk.23.attn_output.weightQ5_K[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightQ5_K[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ6_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ5_K[27648 5120]
-
blk.24.ffn_gate.weightQ5_K[5120 27648]
-
blk.24.ffn_up.weightQ5_K[5120 27648]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightQ5_K[5120 1024]
-
blk.24.attn_output.weightQ5_K[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightQ5_K[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ5_K[5120 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ5_K[27648 5120]
-
blk.25.ffn_gate.weightQ5_K[5120 27648]
-
blk.25.ffn_up.weightQ5_K[5120 27648]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightQ5_K[5120 1024]
-
blk.25.attn_output.weightQ5_K[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightQ5_K[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ5_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ6_K[27648 5120]
-
blk.26.ffn_gate.weightQ5_K[5120 27648]
-
blk.26.ffn_up.weightQ5_K[5120 27648]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightQ5_K[5120 1024]
-
blk.26.attn_output.weightQ5_K[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightQ5_K[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ6_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ5_K[27648 5120]
-
blk.27.ffn_gate.weightQ5_K[5120 27648]
-
blk.27.ffn_up.weightQ5_K[5120 27648]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightQ5_K[5120 1024]
-
blk.27.attn_output.weightQ5_K[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightQ5_K[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ5_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ5_K[27648 5120]
-
blk.28.ffn_gate.weightQ5_K[5120 27648]
-
blk.28.ffn_up.weightQ5_K[5120 27648]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightQ5_K[5120 1024]
-
blk.28.attn_output.weightQ5_K[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightQ5_K[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ5_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ6_K[27648 5120]
-
blk.29.ffn_gate.weightQ5_K[5120 27648]
-
blk.29.ffn_up.weightQ5_K[5120 27648]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightQ5_K[5120 1024]
-
blk.29.attn_output.weightQ5_K[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightQ5_K[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ6_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ5_K[27648 5120]
-
blk.30.ffn_gate.weightQ5_K[5120 27648]
-
blk.30.ffn_up.weightQ5_K[5120 27648]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightQ5_K[5120 1024]
-
blk.30.attn_output.weightQ5_K[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightQ5_K[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ5_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ6_K[27648 5120]
-
blk.31.ffn_gate.weightQ5_K[5120 27648]
-
blk.31.ffn_up.weightQ5_K[5120 27648]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightQ5_K[5120 1024]
-
blk.31.attn_output.weightQ5_K[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightQ5_K[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ6_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ5_K[27648 5120]
-
blk.32.ffn_gate.weightQ5_K[5120 27648]
-
blk.32.ffn_up.weightQ5_K[5120 27648]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightQ5_K[5120 1024]
-
blk.32.attn_output.weightQ5_K[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightQ5_K[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ5_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ5_K[27648 5120]
-
blk.33.ffn_gate.weightQ5_K[5120 27648]
-
blk.33.ffn_up.weightQ5_K[5120 27648]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightQ5_K[5120 1024]
-
blk.33.attn_output.weightQ5_K[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightQ5_K[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ5_K[5120 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ6_K[27648 5120]
-
blk.34.ffn_gate.weightQ5_K[5120 27648]
-
blk.34.ffn_up.weightQ5_K[5120 27648]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightQ5_K[5120 1024]
-
blk.34.attn_output.weightQ5_K[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightQ5_K[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ6_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ5_K[27648 5120]
-
blk.35.ffn_gate.weightQ5_K[5120 27648]
-
blk.35.ffn_up.weightQ5_K[5120 27648]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightQ5_K[5120 1024]
-
blk.35.attn_output.weightQ5_K[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightQ5_K[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ5_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ5_K[27648 5120]
-
blk.36.ffn_gate.weightQ5_K[5120 27648]
-
blk.36.ffn_up.weightQ5_K[5120 27648]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightQ5_K[5120 1024]
-
blk.36.attn_output.weightQ5_K[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightQ5_K[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ5_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ6_K[27648 5120]
-
blk.37.ffn_gate.weightQ5_K[5120 27648]
-
blk.37.ffn_up.weightQ5_K[5120 27648]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightQ5_K[5120 1024]
-
blk.37.attn_output.weightQ5_K[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightQ5_K[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ6_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ5_K[27648 5120]
-
blk.38.ffn_gate.weightQ5_K[5120 27648]
-
blk.38.ffn_up.weightQ5_K[5120 27648]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightQ5_K[5120 1024]
-
blk.38.attn_output.weightQ5_K[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightQ5_K[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ5_K[5120 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ5_K[27648 5120]
-
blk.39.ffn_gate.weightQ5_K[5120 27648]
-
blk.39.ffn_up.weightQ5_K[5120 27648]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightQ5_K[5120 1024]
-
blk.39.attn_output.weightQ5_K[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightQ5_K[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ5_K[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightQ5_K[27648 5120]
-
blk.40.ffn_gate.weightQ5_K[5120 27648]
-
blk.40.ffn_up.weightQ5_K[5120 27648]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightQ5_K[5120 1024]
-
blk.40.attn_output.weightQ5_K[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightQ5_K[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ5_K[5120 1024]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightQ5_K[27648 5120]
-
blk.41.ffn_gate.weightQ5_K[5120 27648]
-
blk.41.ffn_up.weightQ5_K[5120 27648]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightQ5_K[5120 1024]
-
blk.41.attn_output.weightQ5_K[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightQ5_K[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ5_K[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightQ6_K[27648 5120]
-
blk.42.ffn_gate.weightQ5_K[5120 27648]
-
blk.42.ffn_up.weightQ5_K[5120 27648]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightQ5_K[5120 1024]
-
blk.42.attn_output.weightQ5_K[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightQ5_K[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ6_K[5120 1024]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightQ5_K[27648 5120]
-
blk.43.ffn_gate.weightQ5_K[5120 27648]
-
blk.43.ffn_up.weightQ5_K[5120 27648]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightQ5_K[5120 1024]
-
blk.43.attn_output.weightQ5_K[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightQ5_K[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ5_K[5120 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightQ5_K[27648 5120]
-
blk.44.ffn_gate.weightQ5_K[5120 27648]
-
blk.44.ffn_up.weightQ5_K[5120 27648]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightQ5_K[5120 1024]
-
blk.44.attn_output.weightQ5_K[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightQ5_K[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ5_K[5120 1024]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightQ6_K[27648 5120]
-
blk.45.ffn_gate.weightQ5_K[5120 27648]
-
blk.45.ffn_up.weightQ5_K[5120 27648]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightQ5_K[5120 1024]
-
blk.45.attn_output.weightQ5_K[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightQ5_K[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ6_K[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightQ5_K[27648 5120]
-
blk.46.ffn_gate.weightQ5_K[5120 27648]
-
blk.46.ffn_up.weightQ5_K[5120 27648]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightQ5_K[5120 1024]
-
blk.46.attn_output.weightQ5_K[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightQ5_K[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ5_K[5120 1024]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightQ5_K[27648 5120]
-
blk.47.ffn_gate.weightQ5_K[5120 27648]
-
blk.47.ffn_up.weightQ5_K[5120 27648]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightQ5_K[5120 1024]
-
blk.47.attn_output.weightQ5_K[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightQ5_K[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ5_K[5120 1024]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.ffn_down.weightQ6_K[27648 5120]
-
blk.48.ffn_gate.weightQ5_K[5120 27648]
-
blk.48.ffn_up.weightQ5_K[5120 27648]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightQ5_K[5120 1024]
-
blk.48.attn_output.weightQ5_K[5120 5120]
-
blk.48.attn_q.biasF32[5120]
-
blk.48.attn_q.weightQ5_K[5120 5120]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ6_K[5120 1024]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.ffn_down.weightQ5_K[27648 5120]
-
blk.49.ffn_gate.weightQ5_K[5120 27648]
-
blk.49.ffn_up.weightQ5_K[5120 27648]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightQ5_K[5120 1024]
-
blk.49.attn_output.weightQ5_K[5120 5120]
-
blk.49.attn_q.biasF32[5120]
-
blk.49.attn_q.weightQ5_K[5120 5120]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ5_K[5120 1024]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.ffn_down.weightQ6_K[27648 5120]
-
blk.50.ffn_gate.weightQ5_K[5120 27648]
-
blk.50.ffn_up.weightQ5_K[5120 27648]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightQ5_K[5120 1024]
-
blk.50.attn_output.weightQ5_K[5120 5120]
-
blk.50.attn_q.biasF32[5120]
-
blk.50.attn_q.weightQ5_K[5120 5120]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ6_K[5120 1024]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.ffn_down.weightQ5_K[27648 5120]
-
blk.51.ffn_gate.weightQ5_K[5120 27648]
-
blk.51.ffn_up.weightQ5_K[5120 27648]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightQ5_K[5120 1024]
-
blk.51.attn_output.weightQ5_K[5120 5120]
-
blk.51.attn_q.biasF32[5120]
-
blk.51.attn_q.weightQ5_K[5120 5120]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ5_K[5120 1024]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.ffn_down.weightQ5_K[27648 5120]
-
blk.52.ffn_gate.weightQ5_K[5120 27648]
-
blk.52.ffn_up.weightQ5_K[5120 27648]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightQ5_K[5120 1024]
-
blk.52.attn_output.weightQ5_K[5120 5120]
-
blk.52.attn_q.biasF32[5120]
-
blk.52.attn_q.weightQ5_K[5120 5120]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ5_K[5120 1024]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.ffn_down.weightQ6_K[27648 5120]
-
blk.53.ffn_gate.weightQ5_K[5120 27648]
-
blk.53.ffn_up.weightQ5_K[5120 27648]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightQ5_K[5120 1024]
-
blk.53.attn_output.weightQ5_K[5120 5120]
-
blk.53.attn_q.biasF32[5120]
-
blk.53.attn_q.weightQ5_K[5120 5120]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ6_K[5120 1024]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.ffn_down.weightQ5_K[27648 5120]
-
blk.54.ffn_gate.weightQ5_K[5120 27648]
-
blk.54.ffn_up.weightQ5_K[5120 27648]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightQ5_K[5120 1024]
-
blk.54.attn_output.weightQ5_K[5120 5120]
-
blk.54.attn_q.biasF32[5120]
-
blk.54.attn_q.weightQ5_K[5120 5120]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ5_K[5120 1024]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.ffn_down.weightQ5_K[27648 5120]
-
blk.55.ffn_gate.weightQ5_K[5120 27648]
-
blk.55.ffn_up.weightQ5_K[5120 27648]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightQ5_K[5120 1024]
-
blk.55.attn_output.weightQ5_K[5120 5120]
-
blk.55.attn_q.biasF32[5120]
-
blk.55.attn_q.weightQ5_K[5120 5120]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ5_K[5120 1024]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.ffn_down.weightQ6_K[27648 5120]
-
blk.56.ffn_gate.weightQ5_K[5120 27648]
-
blk.56.ffn_up.weightQ5_K[5120 27648]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightQ5_K[5120 1024]
-
blk.56.attn_output.weightQ5_K[5120 5120]
-
blk.56.attn_q.biasF32[5120]
-
blk.56.attn_q.weightQ5_K[5120 5120]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ6_K[5120 1024]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.ffn_down.weightQ5_K[27648 5120]
-
blk.57.ffn_gate.weightQ5_K[5120 27648]
-
blk.57.ffn_up.weightQ5_K[5120 27648]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightQ5_K[5120 1024]
-
blk.57.attn_output.weightQ5_K[5120 5120]
-
blk.57.attn_q.biasF32[5120]
-
blk.57.attn_q.weightQ5_K[5120 5120]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ5_K[5120 1024]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.ffn_down.weightQ5_K[27648 5120]
-
blk.58.ffn_gate.weightQ5_K[5120 27648]
-
blk.58.ffn_up.weightQ5_K[5120 27648]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightQ5_K[5120 1024]
-
blk.58.attn_output.weightQ5_K[5120 5120]
-
blk.58.attn_q.biasF32[5120]
-
blk.58.attn_q.weightQ5_K[5120 5120]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ5_K[5120 1024]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.ffn_down.weightQ6_K[27648 5120]
-
blk.59.ffn_gate.weightQ5_K[5120 27648]
-
blk.59.ffn_up.weightQ5_K[5120 27648]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightQ5_K[5120 1024]
-
blk.59.attn_output.weightQ5_K[5120 5120]
-
blk.59.attn_q.biasF32[5120]
-
blk.59.attn_q.weightQ5_K[5120 5120]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ6_K[5120 1024]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.ffn_down.weightQ6_K[27648 5120]
-
blk.60.ffn_gate.weightQ5_K[5120 27648]
-
blk.60.ffn_up.weightQ5_K[5120 27648]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightQ5_K[5120 1024]
-
blk.60.attn_output.weightQ5_K[5120 5120]
-
blk.60.attn_q.biasF32[5120]
-
blk.60.attn_q.weightQ5_K[5120 5120]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ6_K[5120 1024]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.ffn_down.weightQ6_K[27648 5120]
-
blk.61.ffn_gate.weightQ5_K[5120 27648]
-
blk.61.ffn_up.weightQ5_K[5120 27648]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightQ5_K[5120 1024]
-
blk.61.attn_output.weightQ5_K[5120 5120]
-
blk.61.attn_q.biasF32[5120]
-
blk.61.attn_q.weightQ5_K[5120 5120]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ6_K[5120 1024]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.ffn_down.weightQ6_K[27648 5120]
-
blk.62.ffn_gate.weightQ5_K[5120 27648]
-
blk.62.ffn_up.weightQ5_K[5120 27648]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightQ5_K[5120 1024]
-
blk.62.attn_output.weightQ5_K[5120 5120]
-
blk.62.attn_q.biasF32[5120]
-
blk.62.attn_q.weightQ5_K[5120 5120]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ6_K[5120 1024]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.ffn_down.weightQ6_K[27648 5120]
-
blk.63.ffn_gate.weightQ5_K[5120 27648]
-
blk.63.ffn_up.weightQ5_K[5120 27648]
-
blk.63.ffn_norm.weightF32[5120]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightQ5_K[5120 1024]
-
blk.63.attn_output.weightQ5_K[5120 5120]
-
blk.63.attn_q.biasF32[5120]
-
blk.63.attn_q.weightQ5_K[5120 5120]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ6_K[5120 1024]
-
output.weightQ8_0[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63