Llama 3.1 70b IQs: IQ1_M, IQ2_M, IQ2_S, IQ2_XS, IQ2_XXS, IQ3_XS, IQ4_XS
tools
97 Pulls Updated 3 months ago
2bc4fc6cb5c8 · 24GB
-
general.architecturellama
-
general.basenameMeta-Llama-3.1
-
general.file_type29
-
general.finetuneInstruct
-
general.languages[en, de, fr, it, pt, ...]
-
general.licensellama3.1
-
general.nameMeta Llama 3.1 70B Instruct
-
general.quantization_version2
-
general.size_label70B
-
general.tags[facebook, meta, pytorch, llama, llama-3, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count125
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file/models_out/Meta-Llama-3.1-70B-Instruct-GGUF/Meta-Llama-3.1-70B-Instruct.imatrix
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.0.attn_v.weightQ4_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.1.attn_v.weightQ4_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.2.attn_v.weightQ4_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.3.attn_v.weightQ4_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.4.attn_v.weightQ4_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.5.attn_v.weightQ4_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.6.attn_v.weightQ4_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.7.attn_v.weightQ4_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.8.attn_v.weightQ4_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.9.attn_v.weightQ4_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.10.attn_v.weightQ4_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.11.attn_v.weightQ4_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.12.attn_v.weightQ4_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.13.attn_v.weightQ4_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.14.attn_v.weightQ4_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.15.attn_v.weightQ4_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.16.attn_v.weightQ4_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.17.attn_v.weightQ4_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.18.attn_v.weightQ4_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.19.attn_v.weightQ4_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.20.attn_v.weightQ4_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.21.attn_v.weightQ4_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.22.attn_v.weightQ4_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.23.attn_v.weightQ4_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.24.attn_v.weightQ4_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.25.attn_v.weightQ4_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.26.attn_v.weightQ4_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.27.attn_v.weightQ4_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.28.attn_v.weightQ4_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.29.attn_v.weightQ4_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.30.attn_v.weightQ4_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.31.attn_v.weightQ4_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.32.attn_v.weightQ4_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.33.attn_v.weightQ4_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.34.attn_v.weightQ4_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.35.attn_v.weightQ4_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.36.attn_v.weightQ4_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.37.attn_v.weightQ4_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.38.attn_v.weightQ4_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.39.attn_v.weightQ4_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.40.attn_v.weightQ4_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.41.attn_v.weightQ4_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.42.attn_v.weightQ4_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.43.attn_v.weightQ4_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.44.attn_v.weightQ4_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.45.attn_v.weightQ4_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.46.attn_v.weightQ4_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.47.attn_v.weightQ4_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.48.attn_v.weightQ4_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.49.attn_v.weightQ4_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.50.attn_v.weightQ4_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.51.attn_v.weightQ4_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.52.attn_v.weightQ4_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.53.attn_v.weightQ4_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.54.attn_v.weightQ4_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.55.attn_v.weightQ4_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.56.attn_v.weightQ4_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.57.attn_v.weightQ4_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.58.attn_v.weightQ4_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.59.attn_v.weightQ4_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.60.attn_v.weightQ4_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.61.attn_v.weightQ4_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.62.attn_v.weightQ4_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.63.attn_v.weightQ4_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.64.attn_v.weightQ4_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.65.attn_v.weightQ4_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.66.attn_v.weightQ4_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.67.attn_v.weightQ4_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.68.attn_v.weightQ4_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.69.attn_v.weightQ4_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.70.attn_v.weightQ4_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.71.attn_v.weightQ4_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.72.attn_v.weightQ4_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.73.attn_v.weightQ4_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.74.attn_v.weightQ4_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.75.attn_v.weightQ4_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.76.attn_v.weightQ4_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.77.attn_v.weightQ4_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.78.attn_v.weightQ4_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.79.attn_v.weightQ4_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
output.weightQ5_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79