The latest in the Smaug series - a finetune of Qwen2-72B-Instruct
102 Pulls Updated 4 months ago
bebf85017264 · 41GB
-
general.architectureqwen2
-
general.file_type25
-
general.name..
-
general.quantization_version2
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count80
-
qwen2.context_length32768
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 20!)[8192, 152064]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
output.weightQ6_K[8192, 152064]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79