This model extends LLama-3 70B's context length from 8k to over 1m tokens. [I-Quants]
103 Pulls Updated 5 months ago
e5ac84fc3756 · 38GB
-
general.architecturellama
-
general.file_type30
-
general.nameLlama-3-70B-Instruct-Gradient-1048k
-
general.quantization_version2
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length1048576
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base3.5801654e+09
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count88
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/groups_merged.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128001
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79