Tess-v2.5 (Qwen2-72B) was fine-tuned over the newly released Qwen2-72B base, using the Tess-v2.5 dataset, which contains 300K samples spanning multiple topics.
102 Pulls Updated 3 months ago
c152f761df41 · 30GB
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/training_data/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file/models/Tess-v2.5-Qwen2-72B-GGUF/Tess-v2.5-Qwen2-72B.imatrix
-
general.architectureqwen2
-
general.file_typeQ2_K
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-05
-
qwen2.block_count80
-
qwen2.context_length131072
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151646
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ2_K[8192 152064]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.0.ffn_gate.weightQ2_K[8192 29568]
-
blk.0.ffn_up.weightQ2_K[8192 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightQ2_K[8192 1024]
-
blk.0.attn_output.weightQ3_K[8192 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weightQ2_K[8192 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ5_K[8192 1024]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightQ2_K[8192 1024]
-
blk.1.attn_output.weightQ3_K[8192 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weightQ2_K[8192 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ5_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.1.ffn_gate.weightQ2_K[8192 29568]
-
blk.1.ffn_up.weightQ2_K[8192 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.2.ffn_gate.weightQ2_K[8192 29568]
-
blk.2.ffn_up.weightQ2_K[8192 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightQ2_K[8192 1024]
-
blk.2.attn_output.weightQ3_K[8192 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weightQ2_K[8192 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ5_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.3.ffn_gate.weightQ2_K[8192 29568]
-
blk.3.ffn_up.weightQ2_K[8192 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightQ2_K[8192 1024]
-
blk.3.attn_output.weightQ3_K[8192 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weightQ2_K[8192 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ5_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.4.ffn_gate.weightQ2_K[8192 29568]
-
blk.4.ffn_up.weightQ2_K[8192 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightQ2_K[8192 1024]
-
blk.4.attn_output.weightQ3_K[8192 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weightQ2_K[8192 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ5_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.5.ffn_gate.weightQ2_K[8192 29568]
-
blk.5.ffn_up.weightQ2_K[8192 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightQ2_K[8192 1024]
-
blk.5.attn_output.weightQ3_K[8192 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weightQ2_K[8192 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ5_K[8192 1024]
-
blk.6.ffn_gate.weightQ2_K[8192 29568]
-
blk.6.ffn_up.weightQ2_K[8192 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightQ2_K[8192 1024]
-
blk.6.attn_output.weightQ3_K[8192 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weightQ2_K[8192 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ5_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.7.ffn_gate.weightQ2_K[8192 29568]
-
blk.7.ffn_up.weightQ2_K[8192 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightQ2_K[8192 1024]
-
blk.7.attn_output.weightQ3_K[8192 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weightQ2_K[8192 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ5_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.8.ffn_gate.weightQ2_K[8192 29568]
-
blk.8.ffn_up.weightQ2_K[8192 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightQ2_K[8192 1024]
-
blk.8.attn_output.weightQ3_K[8192 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weightQ2_K[8192 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ5_K[8192 1024]
-
blk.9.ffn_gate.weightQ2_K[8192 29568]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightQ2_K[8192 1024]
-
blk.9.attn_output.weightQ3_K[8192 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weightQ2_K[8192 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ5_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.9.ffn_up.weightQ2_K[8192 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.10.ffn_gate.weightQ2_K[8192 29568]
-
blk.10.ffn_up.weightQ2_K[8192 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightQ2_K[8192 1024]
-
blk.10.attn_output.weightQ3_K[8192 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weightQ2_K[8192 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ5_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.11.ffn_gate.weightQ2_K[8192 29568]
-
blk.11.ffn_up.weightQ2_K[8192 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightQ2_K[8192 1024]
-
blk.11.attn_output.weightQ3_K[8192 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weightQ2_K[8192 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ5_K[8192 1024]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightQ2_K[8192 1024]
-
blk.12.attn_output.weightQ3_K[8192 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weightQ2_K[8192 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ5_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.12.ffn_gate.weightQ2_K[8192 29568]
-
blk.12.ffn_up.weightQ2_K[8192 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.13.ffn_gate.weightQ2_K[8192 29568]
-
blk.13.ffn_up.weightQ2_K[8192 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightQ2_K[8192 1024]
-
blk.13.attn_output.weightQ3_K[8192 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weightQ2_K[8192 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ5_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.14.ffn_gate.weightQ2_K[8192 29568]
-
blk.14.ffn_up.weightQ2_K[8192 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightQ2_K[8192 1024]
-
blk.14.attn_output.weightQ3_K[8192 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weightQ2_K[8192 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ5_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.15.ffn_gate.weightQ2_K[8192 29568]
-
blk.15.ffn_up.weightQ2_K[8192 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightQ2_K[8192 1024]
-
blk.15.attn_output.weightQ3_K[8192 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weightQ2_K[8192 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ5_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.16.ffn_gate.weightQ2_K[8192 29568]
-
blk.16.ffn_up.weightQ2_K[8192 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightQ2_K[8192 1024]
-
blk.16.attn_output.weightQ3_K[8192 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weightQ2_K[8192 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ5_K[8192 1024]
-
blk.17.ffn_gate.weightQ2_K[8192 29568]
-
blk.17.ffn_up.weightQ2_K[8192 29568]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightQ2_K[8192 1024]
-
blk.17.attn_output.weightQ3_K[8192 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weightQ2_K[8192 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ5_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.18.ffn_gate.weightQ2_K[8192 29568]
-
blk.18.ffn_up.weightQ2_K[8192 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightQ2_K[8192 1024]
-
blk.18.attn_output.weightQ3_K[8192 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weightQ2_K[8192 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ5_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.19.ffn_gate.weightQ2_K[8192 29568]
-
blk.19.ffn_up.weightQ2_K[8192 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightQ2_K[8192 1024]
-
blk.19.attn_output.weightQ3_K[8192 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weightQ2_K[8192 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ5_K[8192 1024]
-
blk.20.ffn_gate.weightQ2_K[8192 29568]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightQ2_K[8192 1024]
-
blk.20.attn_output.weightQ3_K[8192 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weightQ2_K[8192 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ5_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.20.ffn_up.weightQ2_K[8192 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.21.ffn_gate.weightQ2_K[8192 29568]
-
blk.21.ffn_up.weightQ2_K[8192 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightQ2_K[8192 1024]
-
blk.21.attn_output.weightQ3_K[8192 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weightQ2_K[8192 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ5_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.22.ffn_gate.weightQ2_K[8192 29568]
-
blk.22.ffn_up.weightQ2_K[8192 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightQ2_K[8192 1024]
-
blk.22.attn_output.weightQ3_K[8192 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weightQ2_K[8192 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ5_K[8192 1024]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightQ2_K[8192 1024]
-
blk.23.attn_output.weightQ3_K[8192 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weightQ2_K[8192 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ5_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.23.ffn_gate.weightQ2_K[8192 29568]
-
blk.23.ffn_up.weightQ2_K[8192 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.24.ffn_gate.weightQ2_K[8192 29568]
-
blk.24.ffn_up.weightQ2_K[8192 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightQ2_K[8192 1024]
-
blk.24.attn_output.weightQ3_K[8192 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weightQ2_K[8192 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ5_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.25.ffn_gate.weightQ2_K[8192 29568]
-
blk.25.ffn_up.weightQ2_K[8192 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightQ2_K[8192 1024]
-
blk.25.attn_output.weightQ3_K[8192 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weightQ2_K[8192 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ5_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.26.ffn_gate.weightQ2_K[8192 29568]
-
blk.26.ffn_up.weightQ2_K[8192 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightQ2_K[8192 1024]
-
blk.26.attn_output.weightQ3_K[8192 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weightQ2_K[8192 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ5_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.27.ffn_gate.weightQ2_K[8192 29568]
-
blk.27.ffn_up.weightQ2_K[8192 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightQ2_K[8192 1024]
-
blk.27.attn_output.weightQ3_K[8192 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weightQ2_K[8192 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ5_K[8192 1024]
-
blk.28.ffn_gate.weightQ2_K[8192 29568]
-
blk.28.ffn_up.weightQ2_K[8192 29568]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightQ2_K[8192 1024]
-
blk.28.attn_output.weightQ3_K[8192 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weightQ2_K[8192 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ5_K[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.29.ffn_gate.weightQ2_K[8192 29568]
-
blk.29.ffn_up.weightQ2_K[8192 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightQ2_K[8192 1024]
-
blk.29.attn_output.weightQ3_K[8192 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weightQ2_K[8192 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ5_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.30.ffn_gate.weightQ2_K[8192 29568]
-
blk.30.ffn_up.weightQ2_K[8192 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightQ2_K[8192 1024]
-
blk.30.attn_output.weightQ3_K[8192 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weightQ2_K[8192 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ5_K[8192 1024]
-
blk.31.ffn_gate.weightQ2_K[8192 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightQ2_K[8192 1024]
-
blk.31.attn_output.weightQ3_K[8192 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weightQ2_K[8192 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ5_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.31.ffn_up.weightQ2_K[8192 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.32.ffn_gate.weightQ2_K[8192 29568]
-
blk.32.ffn_up.weightQ2_K[8192 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightQ2_K[8192 1024]
-
blk.32.attn_output.weightQ3_K[8192 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weightQ2_K[8192 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ5_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.33.ffn_gate.weightQ2_K[8192 29568]
-
blk.33.ffn_up.weightQ2_K[8192 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightQ2_K[8192 1024]
-
blk.33.attn_output.weightQ3_K[8192 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weightQ2_K[8192 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ5_K[8192 1024]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightQ2_K[8192 1024]
-
blk.34.attn_output.weightQ3_K[8192 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weightQ2_K[8192 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ5_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.34.ffn_gate.weightQ2_K[8192 29568]
-
blk.34.ffn_up.weightQ2_K[8192 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.35.ffn_gate.weightQ2_K[8192 29568]
-
blk.35.ffn_up.weightQ2_K[8192 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightQ2_K[8192 1024]
-
blk.35.attn_output.weightQ3_K[8192 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weightQ2_K[8192 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ5_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.36.ffn_gate.weightQ2_K[8192 29568]
-
blk.36.ffn_up.weightQ2_K[8192 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightQ2_K[8192 1024]
-
blk.36.attn_output.weightQ3_K[8192 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weightQ2_K[8192 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ5_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.37.ffn_gate.weightQ2_K[8192 29568]
-
blk.37.ffn_up.weightQ2_K[8192 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightQ2_K[8192 1024]
-
blk.37.attn_output.weightQ3_K[8192 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weightQ2_K[8192 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ5_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.38.ffn_gate.weightQ2_K[8192 29568]
-
blk.38.ffn_up.weightQ2_K[8192 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightQ2_K[8192 1024]
-
blk.38.attn_output.weightQ3_K[8192 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weightQ2_K[8192 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ5_K[8192 1024]
-
blk.39.ffn_gate.weightQ2_K[8192 29568]
-
blk.39.ffn_up.weightQ2_K[8192 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightQ2_K[8192 1024]
-
blk.39.attn_output.weightQ3_K[8192 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weightQ2_K[8192 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ5_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.40.ffn_gate.weightQ2_K[8192 29568]
-
blk.40.ffn_up.weightQ2_K[8192 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightQ2_K[8192 1024]
-
blk.40.attn_output.weightQ3_K[8192 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weightQ2_K[8192 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ5_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.41.ffn_gate.weightQ2_K[8192 29568]
-
blk.41.ffn_up.weightQ2_K[8192 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightQ2_K[8192 1024]
-
blk.41.attn_output.weightQ3_K[8192 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weightQ2_K[8192 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ5_K[8192 1024]
-
blk.42.ffn_gate.weightQ2_K[8192 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightQ2_K[8192 1024]
-
blk.42.attn_output.weightQ3_K[8192 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weightQ2_K[8192 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ5_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.42.ffn_up.weightQ2_K[8192 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.43.ffn_gate.weightQ2_K[8192 29568]
-
blk.43.ffn_up.weightQ2_K[8192 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightQ2_K[8192 1024]
-
blk.43.attn_output.weightQ3_K[8192 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weightQ2_K[8192 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ5_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.44.ffn_gate.weightQ2_K[8192 29568]
-
blk.44.ffn_up.weightQ2_K[8192 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightQ2_K[8192 1024]
-
blk.44.attn_output.weightQ3_K[8192 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weightQ2_K[8192 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ5_K[8192 1024]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightQ2_K[8192 1024]
-
blk.45.attn_output.weightQ3_K[8192 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weightQ2_K[8192 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ5_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.45.ffn_gate.weightQ2_K[8192 29568]
-
blk.45.ffn_up.weightQ2_K[8192 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.46.ffn_gate.weightQ2_K[8192 29568]
-
blk.46.ffn_up.weightQ2_K[8192 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightQ2_K[8192 1024]
-
blk.46.attn_output.weightQ3_K[8192 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weightQ2_K[8192 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ5_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.47.ffn_gate.weightQ2_K[8192 29568]
-
blk.47.ffn_up.weightQ2_K[8192 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightQ2_K[8192 1024]
-
blk.47.attn_output.weightQ3_K[8192 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weightQ2_K[8192 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ5_K[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.48.ffn_gate.weightQ2_K[8192 29568]
-
blk.48.ffn_up.weightQ2_K[8192 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightQ2_K[8192 1024]
-
blk.48.attn_output.weightQ3_K[8192 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weightQ2_K[8192 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ5_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.49.ffn_gate.weightQ2_K[8192 29568]
-
blk.49.ffn_up.weightQ2_K[8192 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightQ2_K[8192 1024]
-
blk.49.attn_output.weightQ3_K[8192 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weightQ2_K[8192 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ5_K[8192 1024]
-
blk.50.ffn_gate.weightQ2_K[8192 29568]
-
blk.50.ffn_up.weightQ2_K[8192 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightQ2_K[8192 1024]
-
blk.50.attn_output.weightQ3_K[8192 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weightQ2_K[8192 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ5_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.51.ffn_gate.weightQ2_K[8192 29568]
-
blk.51.ffn_up.weightQ2_K[8192 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightQ2_K[8192 1024]
-
blk.51.attn_output.weightQ3_K[8192 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weightQ2_K[8192 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ5_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.52.ffn_gate.weightQ2_K[8192 29568]
-
blk.52.ffn_up.weightQ2_K[8192 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightQ2_K[8192 1024]
-
blk.52.attn_output.weightQ3_K[8192 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weightQ2_K[8192 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ5_K[8192 1024]
-
blk.53.ffn_gate.weightQ2_K[8192 29568]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightQ2_K[8192 1024]
-
blk.53.attn_output.weightQ3_K[8192 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weightQ2_K[8192 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ5_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.53.ffn_up.weightQ2_K[8192 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.54.ffn_gate.weightQ2_K[8192 29568]
-
blk.54.ffn_up.weightQ2_K[8192 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightQ2_K[8192 1024]
-
blk.54.attn_output.weightQ3_K[8192 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weightQ2_K[8192 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ5_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.55.ffn_gate.weightQ2_K[8192 29568]
-
blk.55.ffn_up.weightQ2_K[8192 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightQ2_K[8192 1024]
-
blk.55.attn_output.weightQ3_K[8192 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weightQ2_K[8192 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ5_K[8192 1024]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightQ2_K[8192 1024]
-
blk.56.attn_output.weightQ3_K[8192 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weightQ2_K[8192 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ5_K[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.56.ffn_gate.weightQ2_K[8192 29568]
-
blk.56.ffn_up.weightQ2_K[8192 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.57.ffn_gate.weightQ2_K[8192 29568]
-
blk.57.ffn_up.weightQ2_K[8192 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightQ2_K[8192 1024]
-
blk.57.attn_output.weightQ3_K[8192 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weightQ2_K[8192 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ5_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.58.ffn_gate.weightQ2_K[8192 29568]
-
blk.58.ffn_up.weightQ2_K[8192 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightQ2_K[8192 1024]
-
blk.58.attn_output.weightQ3_K[8192 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weightQ2_K[8192 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ5_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.59.ffn_gate.weightQ2_K[8192 29568]
-
blk.59.ffn_up.weightQ2_K[8192 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightQ2_K[8192 1024]
-
blk.59.attn_output.weightQ3_K[8192 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weightQ2_K[8192 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ5_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.60.ffn_gate.weightQ2_K[8192 29568]
-
blk.60.ffn_up.weightQ2_K[8192 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightQ2_K[8192 1024]
-
blk.60.attn_output.weightQ3_K[8192 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weightQ2_K[8192 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ5_K[8192 1024]
-
blk.61.ffn_gate.weightQ2_K[8192 29568]
-
blk.61.ffn_up.weightQ2_K[8192 29568]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightQ2_K[8192 1024]
-
blk.61.attn_output.weightQ3_K[8192 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weightQ2_K[8192 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ5_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.62.ffn_gate.weightQ2_K[8192 29568]
-
blk.62.ffn_up.weightQ2_K[8192 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightQ2_K[8192 1024]
-
blk.62.attn_output.weightQ3_K[8192 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weightQ2_K[8192 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ5_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.63.ffn_gate.weightQ2_K[8192 29568]
-
blk.63.ffn_up.weightQ2_K[8192 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightQ2_K[8192 1024]
-
blk.63.attn_output.weightQ3_K[8192 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weightQ2_K[8192 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ5_K[8192 1024]
-
blk.64.ffn_gate.weightQ2_K[8192 29568]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weightQ2_K[8192 1024]
-
blk.64.attn_output.weightQ3_K[8192 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weightQ2_K[8192 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ5_K[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.64.ffn_up.weightQ2_K[8192 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.65.ffn_gate.weightQ2_K[8192 29568]
-
blk.65.ffn_up.weightQ2_K[8192 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weightQ2_K[8192 1024]
-
blk.65.attn_output.weightQ3_K[8192 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weightQ2_K[8192 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ5_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.66.ffn_gate.weightQ2_K[8192 29568]
-
blk.66.ffn_up.weightQ2_K[8192 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weightQ2_K[8192 1024]
-
blk.66.attn_output.weightQ3_K[8192 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weightQ2_K[8192 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ5_K[8192 1024]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weightQ2_K[8192 1024]
-
blk.67.attn_output.weightQ3_K[8192 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weightQ2_K[8192 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ5_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.67.ffn_gate.weightQ2_K[8192 29568]
-
blk.67.ffn_up.weightQ2_K[8192 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.68.ffn_gate.weightQ2_K[8192 29568]
-
blk.68.ffn_up.weightQ2_K[8192 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weightQ2_K[8192 1024]
-
blk.68.attn_output.weightQ3_K[8192 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weightQ2_K[8192 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ5_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.69.ffn_gate.weightQ2_K[8192 29568]
-
blk.69.ffn_up.weightQ2_K[8192 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weightQ2_K[8192 1024]
-
blk.69.attn_output.weightQ3_K[8192 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weightQ2_K[8192 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ5_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.70.ffn_gate.weightQ2_K[8192 29568]
-
blk.70.ffn_up.weightQ2_K[8192 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weightQ2_K[8192 1024]
-
blk.70.attn_output.weightQ3_K[8192 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weightQ2_K[8192 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ5_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.71.ffn_gate.weightQ2_K[8192 29568]
-
blk.71.ffn_up.weightQ2_K[8192 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weightQ2_K[8192 1024]
-
blk.71.attn_output.weightQ3_K[8192 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weightQ2_K[8192 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ5_K[8192 1024]
-
blk.72.ffn_gate.weightQ2_K[8192 29568]
-
blk.72.ffn_up.weightQ2_K[8192 29568]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weightQ2_K[8192 1024]
-
blk.72.attn_output.weightQ3_K[8192 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weightQ2_K[8192 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ5_K[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.73.ffn_gate.weightQ2_K[8192 29568]
-
blk.73.ffn_up.weightQ2_K[8192 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weightQ2_K[8192 1024]
-
blk.73.attn_output.weightQ3_K[8192 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weightQ2_K[8192 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ5_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.74.ffn_gate.weightQ2_K[8192 29568]
-
blk.74.ffn_up.weightQ2_K[8192 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weightQ2_K[8192 1024]
-
blk.74.attn_output.weightQ3_K[8192 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weightQ2_K[8192 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ5_K[8192 1024]
-
blk.75.ffn_gate.weightQ2_K[8192 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weightQ2_K[8192 1024]
-
blk.75.attn_output.weightQ3_K[8192 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weightQ2_K[8192 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ5_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.75.ffn_up.weightQ2_K[8192 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.76.ffn_gate.weightQ2_K[8192 29568]
-
blk.76.ffn_up.weightQ2_K[8192 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weightQ2_K[8192 1024]
-
blk.76.attn_output.weightQ3_K[8192 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weightQ2_K[8192 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ5_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.77.ffn_gate.weightQ2_K[8192 29568]
-
blk.77.ffn_up.weightQ2_K[8192 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weightQ2_K[8192 1024]
-
blk.77.attn_output.weightQ3_K[8192 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weightQ2_K[8192 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ5_K[8192 1024]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weightQ2_K[8192 1024]
-
blk.78.attn_output.weightQ3_K[8192 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weightQ2_K[8192 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ5_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.78.ffn_gate.weightQ2_K[8192 29568]
-
blk.78.ffn_up.weightQ2_K[8192 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.79.ffn_gate.weightQ2_K[8192 29568]
-
blk.79.ffn_up.weightQ2_K[8192 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weightQ2_K[8192 1024]
-
blk.79.attn_output.weightQ3_K[8192 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weightQ2_K[8192 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ5_K[8192 1024]
-
output_norm.weightF32[8192]
-
output.weightQ6_K[8192 152064]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79