Llama 3.1 70b IQs: IQ1_M, IQ2_M, IQ2_S, IQ2_XS, IQ2_XXS, IQ3_XS, IQ4_XS
tools
107 Pulls Updated 3 months ago
4a9755870610 · 38GB
-
general.architecturellama
-
general.basenameMeta-Llama-3.1
-
general.file_type30
-
general.finetuneInstruct
-
general.languages[en, de, fr, it, pt, ...]
-
general.licensellama3.1
-
general.nameMeta Llama 3.1 70B Instruct
-
general.quantization_version2
-
general.size_label70B
-
general.tags[facebook, meta, pytorch, llama, llama-3, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count125
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file/models_out/Meta-Llama-3.1-70B-Instruct-GGUF/Meta-Llama-3.1-70B-Instruct.imatrix
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 23!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 23!)[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 23!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 23!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 23!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79