The latest in the Smaug series - a finetune of Qwen2-72B-Instruct
102 Pulls Updated 4 months ago
15fe4b67ba38 · 32GB
-
general.architectureqwen2
-
general.file_type23
-
general.name..
-
general.quantization_version2
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count80
-
qwen2.context_length32768
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[8192, 152064]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.0.ffn_gate.weightI32[8192, 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weightI32[8192, 29568]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.1.ffn_gate.weightI32[8192, 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weightI32[8192, 29568]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.2.ffn_gate.weightI32[8192, 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weightI32[8192, 29568]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.3.ffn_gate.weightI32[8192, 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weightI32[8192, 29568]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.4.ffn_gate.weightI32[8192, 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weightI32[8192, 29568]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.5.ffn_gate.weightI32[8192, 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weightI32[8192, 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.6.ffn_gate.weightI32[8192, 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weightI32[8192, 29568]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.7.ffn_gate.weightI32[8192, 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weightI32[8192, 29568]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.8.ffn_gate.weightI32[8192, 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weightI32[8192, 29568]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.9.ffn_gate.weightI32[8192, 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weightI32[8192, 29568]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.10.ffn_gate.weightI32[8192, 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weightI32[8192, 29568]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.11.ffn_gate.weightI32[8192, 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weightI32[8192, 29568]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.12.ffn_gate.weightI32[8192, 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weightI32[8192, 29568]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.13.ffn_gate.weightI32[8192, 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weightI32[8192, 29568]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.14.ffn_gate.weightI32[8192, 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weightI32[8192, 29568]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.15.ffn_gate.weightI32[8192, 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weightI32[8192, 29568]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.16.ffn_gate.weightI32[8192, 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weightI32[8192, 29568]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.17.ffn_gate.weightI32[8192, 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weightI32[8192, 29568]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.18.ffn_gate.weightI32[8192, 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weightI32[8192, 29568]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.19.ffn_gate.weightI32[8192, 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weightI32[8192, 29568]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.20.ffn_gate.weightI32[8192, 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weightI32[8192, 29568]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.21.ffn_gate.weightI32[8192, 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weightI32[8192, 29568]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.22.ffn_gate.weightI32[8192, 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weightI32[8192, 29568]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.23.ffn_gate.weightI32[8192, 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weightI32[8192, 29568]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.24.ffn_gate.weightI32[8192, 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weightI32[8192, 29568]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.25.ffn_gate.weightI32[8192, 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weightI32[8192, 29568]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.26.ffn_gate.weightI32[8192, 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weightI32[8192, 29568]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.27.ffn_gate.weightI32[8192, 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weightI32[8192, 29568]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.28.ffn_gate.weightI32[8192, 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weightI32[8192, 29568]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.29.ffn_gate.weightI32[8192, 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weightI32[8192, 29568]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.30.ffn_gate.weightI32[8192, 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weightI32[8192, 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.31.ffn_gate.weightI32[8192, 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weightI32[8192, 29568]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.32.ffn_gate.weightI32[8192, 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weightI32[8192, 29568]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.33.ffn_gate.weightI32[8192, 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weightI32[8192, 29568]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.34.ffn_gate.weightI32[8192, 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weightI32[8192, 29568]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.35.ffn_gate.weightI32[8192, 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weightI32[8192, 29568]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.36.ffn_gate.weightI32[8192, 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weightI32[8192, 29568]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.37.ffn_gate.weightI32[8192, 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weightI32[8192, 29568]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.38.ffn_gate.weightI32[8192, 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weightI32[8192, 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.39.ffn_gate.weightI32[8192, 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weightI32[8192, 29568]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.40.ffn_gate.weightI32[8192, 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weightI32[8192, 29568]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.41.ffn_gate.weightI32[8192, 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weightI32[8192, 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.42.ffn_gate.weightI32[8192, 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weightI32[8192, 29568]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.43.ffn_gate.weightI32[8192, 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weightI32[8192, 29568]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.44.ffn_gate.weightI32[8192, 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weightI32[8192, 29568]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.45.ffn_gate.weightI32[8192, 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weightI32[8192, 29568]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.46.ffn_gate.weightI32[8192, 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weightI32[8192, 29568]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.47.ffn_gate.weightI32[8192, 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weightI32[8192, 29568]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.48.ffn_gate.weightI32[8192, 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weightI32[8192, 29568]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.49.ffn_gate.weightI32[8192, 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weightI32[8192, 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.50.ffn_gate.weightI32[8192, 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weightI32[8192, 29568]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.51.ffn_gate.weightI32[8192, 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weightI32[8192, 29568]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.52.ffn_gate.weightI32[8192, 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weightI32[8192, 29568]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.53.ffn_gate.weightI32[8192, 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weightI32[8192, 29568]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.54.ffn_gate.weightI32[8192, 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weightI32[8192, 29568]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.55.ffn_gate.weightI32[8192, 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weightI32[8192, 29568]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.56.ffn_gate.weightI32[8192, 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weightI32[8192, 29568]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.57.ffn_gate.weightI32[8192, 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weightI32[8192, 29568]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.58.ffn_gate.weightI32[8192, 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weightI32[8192, 29568]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.59.ffn_gate.weightI32[8192, 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weightI32[8192, 29568]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.60.ffn_gate.weightI32[8192, 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weightI32[8192, 29568]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.61.ffn_gate.weightI32[8192, 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weightI32[8192, 29568]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.62.ffn_gate.weightI32[8192, 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weightI32[8192, 29568]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.63.ffn_gate.weightI32[8192, 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weightI32[8192, 29568]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.64.ffn_gate.weightI32[8192, 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weightI32[8192, 29568]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.65.ffn_gate.weightI32[8192, 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weightI32[8192, 29568]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.66.ffn_gate.weightI32[8192, 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weightI32[8192, 29568]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.67.ffn_gate.weightI32[8192, 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weightI32[8192, 29568]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.68.ffn_gate.weightI32[8192, 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weightI32[8192, 29568]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.69.ffn_gate.weightI32[8192, 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weightI32[8192, 29568]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.70.ffn_gate.weightI32[8192, 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weightI32[8192, 29568]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.71.ffn_gate.weightI32[8192, 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weightI32[8192, 29568]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.72.ffn_gate.weightI32[8192, 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weightI32[8192, 29568]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.73.ffn_gate.weightI32[8192, 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weightI32[8192, 29568]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.74.ffn_gate.weightI32[8192, 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weightI32[8192, 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.75.ffn_gate.weightI32[8192, 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weightI32[8192, 29568]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.76.ffn_gate.weightI32[8192, 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weightI32[8192, 29568]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.77.ffn_gate.weightI32[8192, 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weightI32[8192, 29568]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.78.ffn_gate.weightI32[8192, 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weightI32[8192, 29568]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.79.ffn_gate.weightI32[8192, 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weightI32[8192, 29568]
-
output.weightQ5_K[8192, 152064]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79