New state-of-the-art model from Meta available in 8B, 70B and 405B sizes
tools
168 Pulls Updated 3 months ago
5ac3b2446ffe · 31GB
-
general.architecturellama
-
general.file_type26
-
general.finetune..
-
general.languages[en, de, fr, it, pt, ...]
-
general.licensellama3.1
-
general.name..
-
general.quantization_version2
-
general.size_label71B
-
general.tags[facebook, meta, pytorch, llama, llama-3, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count62
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 21!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79