This model was built by applying a new Smaug recipe, designed to improve performance on real-world multi-turn conversations, to Meta-Llama-3-70B-Instruct. It has a 32k context length.
134 Pulls Updated 5 months ago
95e7fee88dd4 · 38GB
-
general.architecturellama
-
general.file_type30
-
general.name..
-
general.quantization_version2
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length32768
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base3e+06
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count88
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/groups_merged.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128001
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id128001
-
tokenizer.ggml.presmaug-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79