I-quants for qwen2.5-72b-instruct
Tools
72B
50 Pulls Updated 2 weeks ago
5d8386e3a446 · 25GB
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file/models_out/Qwen2.5-72B-Instruct-GGUF/Qwen2.5-72B-Instruct.imatrix
-
general.architectureqwen2
-
general.file_typeIQ2_XXS
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count80
-
qwen2.context_length32768
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ2_K[8192 152064]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_gate.weightI8[8192 29568]
-
blk.0.ffn_up.weightI8[8192 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightI8[8192 1024]
-
blk.0.attn_output.weightI8[8192 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weightI8[8192 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[8192 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.1.ffn_gate.weightI8[8192 29568]
-
blk.1.ffn_up.weightI8[8192 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightI8[8192 1024]
-
blk.1.attn_output.weightI8[8192 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weightI8[8192 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.2.ffn_gate.weightI8[8192 29568]
-
blk.2.ffn_up.weightI8[8192 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightI8[8192 1024]
-
blk.2.attn_output.weightI8[8192 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weightI8[8192 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.3.ffn_gate.weightI8[8192 29568]
-
blk.3.ffn_up.weightI8[8192 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightI8[8192 1024]
-
blk.3.attn_output.weightI8[8192 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weightI8[8192 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.4.ffn_gate.weightI8[8192 29568]
-
blk.4.ffn_up.weightI8[8192 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightI8[8192 1024]
-
blk.4.attn_output.weightI8[8192 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weightI8[8192 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightI8[8192 1024]
-
blk.5.attn_output.weightI8[8192 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weightI8[8192 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[8192 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.5.ffn_gate.weightI8[8192 29568]
-
blk.5.ffn_up.weightI8[8192 29568]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.6.ffn_gate.weightI8[8192 29568]
-
blk.6.ffn_up.weightI8[8192 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightI8[8192 1024]
-
blk.6.attn_output.weightI8[8192 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weightI8[8192 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_up.weightI8[8192 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightI8[8192 1024]
-
blk.7.attn_output.weightI8[8192 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weightI8[8192 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[8192 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.7.ffn_gate.weightI8[8192 29568]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.8.ffn_gate.weightI8[8192 29568]
-
blk.8.ffn_up.weightI8[8192 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightI8[8192 1024]
-
blk.8.attn_output.weightI8[8192 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weightI8[8192 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_gate.weightI8[8192 29568]
-
blk.9.ffn_up.weightI8[8192 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightI8[8192 1024]
-
blk.9.attn_output.weightI8[8192 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weightI8[8192 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.10.ffn_gate.weightI8[8192 29568]
-
blk.10.ffn_up.weightI8[8192 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightI8[8192 1024]
-
blk.10.attn_output.weightI8[8192 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weightI8[8192 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.11.ffn_gate.weightI8[8192 29568]
-
blk.11.ffn_up.weightI8[8192 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightI8[8192 1024]
-
blk.11.attn_output.weightI8[8192 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weightI8[8192 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.12.ffn_gate.weightI8[8192 29568]
-
blk.12.ffn_up.weightI8[8192 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightI8[8192 1024]
-
blk.12.attn_output.weightI8[8192 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weightI8[8192 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.13.ffn_gate.weightI8[8192 29568]
-
blk.13.ffn_up.weightI8[8192 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightI8[8192 1024]
-
blk.13.attn_output.weightI8[8192 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weightI8[8192 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightI8[8192 1024]
-
blk.14.attn_output.weightI8[8192 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weightI8[8192 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[8192 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.14.ffn_gate.weightI8[8192 29568]
-
blk.14.ffn_up.weightI8[8192 29568]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.15.ffn_gate.weightI8[8192 29568]
-
blk.15.ffn_up.weightI8[8192 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightI8[8192 1024]
-
blk.15.attn_output.weightI8[8192 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weightI8[8192 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_up.weightI8[8192 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightI8[8192 1024]
-
blk.16.attn_output.weightI8[8192 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weightI8[8192 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.16.ffn_gate.weightI8[8192 29568]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.17.ffn_gate.weightI8[8192 29568]
-
blk.17.ffn_up.weightI8[8192 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightI8[8192 1024]
-
blk.17.attn_output.weightI8[8192 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weightI8[8192 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_gate.weightI8[8192 29568]
-
blk.18.ffn_up.weightI8[8192 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightI8[8192 1024]
-
blk.18.attn_output.weightI8[8192 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weightI8[8192 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.19.ffn_gate.weightI8[8192 29568]
-
blk.19.ffn_up.weightI8[8192 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightI8[8192 1024]
-
blk.19.attn_output.weightI8[8192 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weightI8[8192 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.20.ffn_gate.weightI8[8192 29568]
-
blk.20.ffn_up.weightI8[8192 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightI8[8192 1024]
-
blk.20.attn_output.weightI8[8192 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weightI8[8192 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.21.ffn_gate.weightI8[8192 29568]
-
blk.21.ffn_up.weightI8[8192 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightI8[8192 1024]
-
blk.21.attn_output.weightI8[8192 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weightI8[8192 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.22.ffn_gate.weightI8[8192 29568]
-
blk.22.ffn_up.weightI8[8192 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightI8[8192 1024]
-
blk.22.attn_output.weightI8[8192 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weightI8[8192 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightI8[8192 1024]
-
blk.23.attn_output.weightI8[8192 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weightI8[8192 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.23.ffn_gate.weightI8[8192 29568]
-
blk.23.ffn_up.weightI8[8192 29568]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.24.ffn_gate.weightI8[8192 29568]
-
blk.24.ffn_up.weightI8[8192 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightI8[8192 1024]
-
blk.24.attn_output.weightI8[8192 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weightI8[8192 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_up.weightI8[8192 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightI8[8192 1024]
-
blk.25.attn_output.weightI8[8192 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weightI8[8192 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.25.ffn_gate.weightI8[8192 29568]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.26.ffn_gate.weightI8[8192 29568]
-
blk.26.ffn_up.weightI8[8192 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightI8[8192 1024]
-
blk.26.attn_output.weightI8[8192 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weightI8[8192 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_gate.weightI8[8192 29568]
-
blk.27.ffn_up.weightI8[8192 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightI8[8192 1024]
-
blk.27.attn_output.weightI8[8192 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weightI8[8192 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.28.ffn_gate.weightI8[8192 29568]
-
blk.28.ffn_up.weightI8[8192 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightI8[8192 1024]
-
blk.28.attn_output.weightI8[8192 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weightI8[8192 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.29.ffn_gate.weightI8[8192 29568]
-
blk.29.ffn_up.weightI8[8192 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightI8[8192 1024]
-
blk.29.attn_output.weightI8[8192 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weightI8[8192 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.30.ffn_gate.weightI8[8192 29568]
-
blk.30.ffn_up.weightI8[8192 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightI8[8192 1024]
-
blk.30.attn_output.weightI8[8192 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weightI8[8192 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.31.ffn_gate.weightI8[8192 29568]
-
blk.31.ffn_up.weightI8[8192 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightI8[8192 1024]
-
blk.31.attn_output.weightI8[8192 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weightI8[8192 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightI8[8192 1024]
-
blk.32.attn_output.weightI8[8192 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weightI8[8192 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.32.ffn_gate.weightI8[8192 29568]
-
blk.32.ffn_up.weightI8[8192 29568]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.33.ffn_gate.weightI8[8192 29568]
-
blk.33.ffn_up.weightI8[8192 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightI8[8192 1024]
-
blk.33.attn_output.weightI8[8192 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weightI8[8192 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_up.weightI8[8192 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightI8[8192 1024]
-
blk.34.attn_output.weightI8[8192 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weightI8[8192 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.34.ffn_gate.weightI8[8192 29568]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.35.ffn_gate.weightI8[8192 29568]
-
blk.35.ffn_up.weightI8[8192 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightI8[8192 1024]
-
blk.35.attn_output.weightI8[8192 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weightI8[8192 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_gate.weightI8[8192 29568]
-
blk.36.ffn_up.weightI8[8192 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightI8[8192 1024]
-
blk.36.attn_output.weightI8[8192 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weightI8[8192 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.37.ffn_gate.weightI8[8192 29568]
-
blk.37.ffn_up.weightI8[8192 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightI8[8192 1024]
-
blk.37.attn_output.weightI8[8192 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weightI8[8192 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.38.ffn_gate.weightI8[8192 29568]
-
blk.38.ffn_up.weightI8[8192 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightI8[8192 1024]
-
blk.38.attn_output.weightI8[8192 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weightI8[8192 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.39.ffn_gate.weightI8[8192 29568]
-
blk.39.ffn_up.weightI8[8192 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightI8[8192 1024]
-
blk.39.attn_output.weightI8[8192 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weightI8[8192 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.40.ffn_gate.weightI8[8192 29568]
-
blk.40.ffn_up.weightI8[8192 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightI8[8192 1024]
-
blk.40.attn_output.weightI8[8192 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weightI8[8192 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightI8[8192 1024]
-
blk.41.attn_output.weightI8[8192 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weightI8[8192 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.41.ffn_gate.weightI8[8192 29568]
-
blk.41.ffn_up.weightI8[8192 29568]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.42.ffn_gate.weightI8[8192 29568]
-
blk.42.ffn_up.weightI8[8192 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightI8[8192 1024]
-
blk.42.attn_output.weightI8[8192 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weightI8[8192 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_up.weightI8[8192 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightI8[8192 1024]
-
blk.43.attn_output.weightI8[8192 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weightI8[8192 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.43.ffn_gate.weightI8[8192 29568]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.44.ffn_gate.weightI8[8192 29568]
-
blk.44.ffn_up.weightI8[8192 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightI8[8192 1024]
-
blk.44.attn_output.weightI8[8192 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weightI8[8192 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_gate.weightI8[8192 29568]
-
blk.45.ffn_up.weightI8[8192 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightI8[8192 1024]
-
blk.45.attn_output.weightI8[8192 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weightI8[8192 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.46.ffn_gate.weightI8[8192 29568]
-
blk.46.ffn_up.weightI8[8192 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightI8[8192 1024]
-
blk.46.attn_output.weightI8[8192 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weightI8[8192 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.47.ffn_gate.weightI8[8192 29568]
-
blk.47.ffn_up.weightI8[8192 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightI8[8192 1024]
-
blk.47.attn_output.weightI8[8192 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weightI8[8192 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.48.ffn_gate.weightI8[8192 29568]
-
blk.48.ffn_up.weightI8[8192 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightI8[8192 1024]
-
blk.48.attn_output.weightI8[8192 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weightI8[8192 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.49.ffn_gate.weightI8[8192 29568]
-
blk.49.ffn_up.weightI8[8192 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightI8[8192 1024]
-
blk.49.attn_output.weightI8[8192 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weightI8[8192 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightI8[8192 1024]
-
blk.50.attn_output.weightI8[8192 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weightI8[8192 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_K[8192 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.50.ffn_gate.weightI8[8192 29568]
-
blk.50.ffn_up.weightI8[8192 29568]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.51.ffn_gate.weightI8[8192 29568]
-
blk.51.ffn_up.weightI8[8192 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightI8[8192 1024]
-
blk.51.attn_output.weightI8[8192 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weightI8[8192 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_up.weightI8[8192 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightI8[8192 1024]
-
blk.52.attn_output.weightI8[8192 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weightI8[8192 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_K[8192 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.52.ffn_gate.weightI8[8192 29568]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.53.ffn_gate.weightI8[8192 29568]
-
blk.53.ffn_up.weightI8[8192 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightI8[8192 1024]
-
blk.53.attn_output.weightI8[8192 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weightI8[8192 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_gate.weightI8[8192 29568]
-
blk.54.ffn_up.weightI8[8192 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightI8[8192 1024]
-
blk.54.attn_output.weightI8[8192 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weightI8[8192 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_K[8192 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.55.ffn_gate.weightI8[8192 29568]
-
blk.55.ffn_up.weightI8[8192 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightI8[8192 1024]
-
blk.55.attn_output.weightI8[8192 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weightI8[8192 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_K[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.56.ffn_gate.weightI8[8192 29568]
-
blk.56.ffn_up.weightI8[8192 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightI8[8192 1024]
-
blk.56.attn_output.weightI8[8192 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weightI8[8192 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.57.ffn_gate.weightI8[8192 29568]
-
blk.57.ffn_up.weightI8[8192 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightI8[8192 1024]
-
blk.57.attn_output.weightI8[8192 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weightI8[8192 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.58.ffn_gate.weightI8[8192 29568]
-
blk.58.ffn_up.weightI8[8192 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightI8[8192 1024]
-
blk.58.attn_output.weightI8[8192 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weightI8[8192 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightI8[8192 1024]
-
blk.59.attn_output.weightI8[8192 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weightI8[8192 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_K[8192 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.59.ffn_gate.weightI8[8192 29568]
-
blk.59.ffn_up.weightI8[8192 29568]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.60.ffn_gate.weightI8[8192 29568]
-
blk.60.ffn_up.weightI8[8192 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightI8[8192 1024]
-
blk.60.attn_output.weightI8[8192 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weightI8[8192 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_up.weightI8[8192 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightI8[8192 1024]
-
blk.61.attn_output.weightI8[8192 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weightI8[8192 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_K[8192 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.61.ffn_gate.weightI8[8192 29568]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.62.ffn_gate.weightI8[8192 29568]
-
blk.62.ffn_up.weightI8[8192 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightI8[8192 1024]
-
blk.62.attn_output.weightI8[8192 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weightI8[8192 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_gate.weightI8[8192 29568]
-
blk.63.ffn_up.weightI8[8192 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightI8[8192 1024]
-
blk.63.attn_output.weightI8[8192 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weightI8[8192 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_K[8192 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.64.ffn_gate.weightI8[8192 29568]
-
blk.64.ffn_up.weightI8[8192 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weightI8[8192 1024]
-
blk.64.attn_output.weightI8[8192 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weightI8[8192 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ4_K[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.65.ffn_gate.weightI8[8192 29568]
-
blk.65.ffn_up.weightI8[8192 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weightI8[8192 1024]
-
blk.65.attn_output.weightI8[8192 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weightI8[8192 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ4_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.66.ffn_gate.weightI8[8192 29568]
-
blk.66.ffn_up.weightI8[8192 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weightI8[8192 1024]
-
blk.66.attn_output.weightI8[8192 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weightI8[8192 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ4_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.67.ffn_gate.weightI8[8192 29568]
-
blk.67.ffn_up.weightI8[8192 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weightI8[8192 1024]
-
blk.67.attn_output.weightI8[8192 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weightI8[8192 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ4_K[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weightI8[8192 1024]
-
blk.68.attn_output.weightI8[8192 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weightI8[8192 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ4_K[8192 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.68.ffn_gate.weightI8[8192 29568]
-
blk.68.ffn_up.weightI8[8192 29568]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.69.ffn_gate.weightI8[8192 29568]
-
blk.69.ffn_up.weightI8[8192 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weightI8[8192 1024]
-
blk.69.attn_output.weightI8[8192 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weightI8[8192 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_up.weightI8[8192 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weightI8[8192 1024]
-
blk.70.attn_output.weightI8[8192 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weightI8[8192 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ4_K[8192 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.70.ffn_gate.weightI8[8192 29568]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.71.ffn_gate.weightI8[8192 29568]
-
blk.71.ffn_up.weightI8[8192 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weightI8[8192 1024]
-
blk.71.attn_output.weightI8[8192 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weightI8[8192 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ4_K[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_gate.weightI8[8192 29568]
-
blk.72.ffn_up.weightI8[8192 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weightI8[8192 1024]
-
blk.72.attn_output.weightI8[8192 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weightI8[8192 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ4_K[8192 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.73.ffn_gate.weightI8[8192 29568]
-
blk.73.ffn_up.weightI8[8192 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weightI8[8192 1024]
-
blk.73.attn_output.weightI8[8192 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weightI8[8192 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.74.ffn_gate.weightI8[8192 29568]
-
blk.74.ffn_up.weightI8[8192 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weightI8[8192 1024]
-
blk.74.attn_output.weightI8[8192 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weightI8[8192 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ4_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.75.ffn_gate.weightI8[8192 29568]
-
blk.75.ffn_up.weightI8[8192 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weightI8[8192 1024]
-
blk.75.attn_output.weightI8[8192 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weightI8[8192 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ4_K[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.76.ffn_gate.weightI8[8192 29568]
-
blk.76.ffn_up.weightI8[8192 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weightI8[8192 1024]
-
blk.76.attn_output.weightI8[8192 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weightI8[8192 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weightI8[8192 1024]
-
blk.77.attn_output.weightI8[8192 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weightI8[8192 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ4_K[8192 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.77.ffn_gate.weightI8[8192 29568]
-
blk.77.ffn_up.weightI8[8192 29568]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.78.ffn_gate.weightI8[8192 29568]
-
blk.78.ffn_up.weightI8[8192 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weightI8[8192 1024]
-
blk.78.attn_output.weightI8[8192 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weightI8[8192 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ4_K[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_up.weightI8[8192 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weightI8[8192 1024]
-
blk.79.attn_output.weightI8[8192 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weightI8[8192 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ4_K[8192 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.79.ffn_gate.weightI8[8192 29568]
-
output.weightQ5_K[8192 152064]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79