This model is based on Qwen2-72b. Dolphin-2.9.2 has a variety of instruction, conversational, and coding skills. It also has initial agentic abilities and supports function calling. Dolphin is uncensored.
467 Pulls Updated 4 months ago
f43c438bc085 · 40GB
-
general.architectureqwen2
-
general.file_type30
-
general.name..
-
general.quantization_version2
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-05
-
qwen2.block_count80
-
qwen2.context_length131072
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151644
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[8192, 152064]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 23!)[8192, 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 23!)[8192, 29568]
-
output.weightQ6_K[8192, 152064]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79