This model was built using a new Smaug recipe for improving performance on real world multi-turn conversations applied to Meta-Llama-3-70B-Instruct
202 Pulls Updated 5 months ago
a8fde15130ea · 31GB
-
general.architecturellama
-
general.file_type26
-
general.name..
-
general.quantization_version2
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length8192
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count200
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/groups_merged.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128001
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id128001
-
tokenizer.ggml.presmaug-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79