This model is based on Qwen2-72b. Dolphin-2.9.2 has a variety of instruction, conversational, and coding skills. It also has initial agentic abilities and supports function calling. Dolphin is uncensored.
467 Pulls Updated 4 months ago
2ee6e8c7ede3 · 41GB
-
general.architectureqwen2
-
general.file_type25
-
general.name..
-
general.quantization_version2
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-05
-
qwen2.block_count80
-
qwen2.context_length131072
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151644
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
Name | Type | Shape
-
token_embd.weight(!unknown_type 20!)[8192, 152064]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 20!)[8192, 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 20!)[8192, 29568]
-
output.weightQ6_K[8192, 152064]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79