The latest in the Smaug series - a finetune of Qwen2-72B-Instruct
102 Pulls Updated 4 months ago
c18e976972d2 · 40GB
-
general.architectureqwen2
-
general.file_type30
-
general.name..
-
general.quantization_version2
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count80
-
qwen2.context_length32768
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[8192, 152064]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
output.weightQ6_K[8192, 152064]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79