Llama 3.1 70b IQs: IQ1_M, IQ2_M, IQ2_S, IQ2_XS, IQ2_XXS, IQ3_XS, IQ4_XS
tools
97 Pulls Updated 3 months ago
0695183f116d · 17GB
-
general.architecturellama
-
general.basenameMeta-Llama-3.1
-
general.file_type31
-
general.finetuneInstruct
-
general.languages[en, de, fr, it, pt, ...]
-
general.licensellama3.1
-
general.nameMeta Llama 3.1 70B Instruct
-
general.quantization_version2
-
general.size_label70B
-
general.tags[facebook, meta, pytorch, llama, llama-3, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count125
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file/models_out/Meta-Llama-3.1-70B-Instruct-GGUF/Meta-Llama-3.1-70B-Instruct.imatrix
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weightQ2_K[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weightI8[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.0.attn_v.weightQ4_K[8192, 1024]
-
blk.0.ffn_down.weightQ2_K[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weightI8[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.1.attn_v.weightQ4_K[8192, 1024]
-
blk.1.ffn_down.weightQ2_K[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weightI8[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.2.attn_v.weightQ4_K[8192, 1024]
-
blk.2.ffn_down.weightQ2_K[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weightI8[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.3.attn_v.weightQ4_K[8192, 1024]
-
blk.3.ffn_down.weightQ2_K[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weightI8[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.4.attn_v.weightQ4_K[8192, 1024]
-
blk.4.ffn_down.weightQ2_K[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weightI8[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.5.attn_v.weightQ4_K[8192, 1024]
-
blk.5.ffn_down.weightQ2_K[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weightI8[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.6.attn_v.weightQ4_K[8192, 1024]
-
blk.6.ffn_down.weightQ2_K[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weightI8[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.7.attn_v.weightQ4_K[8192, 1024]
-
blk.7.ffn_down.weightQ2_K[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weightI8[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.8.attn_v.weightQ4_K[8192, 1024]
-
blk.8.ffn_down.weightQ2_K[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weightI8[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.9.attn_v.weightQ4_K[8192, 1024]
-
blk.9.ffn_down.weightQ2_K[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weightI8[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.10.attn_v.weightQ4_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weightI8[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.11.attn_v.weightQ4_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weightI8[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.12.attn_v.weightQ4_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weightI8[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.13.attn_v.weightQ4_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weightI8[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.14.attn_v.weightQ4_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weightI8[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.15.attn_v.weightQ4_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weightI8[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.16.attn_v.weightQ4_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weightI8[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.17.attn_v.weightQ4_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weightI8[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.18.attn_v.weightQ4_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weightI8[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.19.attn_v.weightQ4_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weightI8[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.20.attn_v.weightQ4_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weightI8[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.21.attn_v.weightQ4_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weightI8[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.22.attn_v.weightQ4_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weightI8[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.23.attn_v.weightQ4_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weightI8[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.24.attn_v.weightQ4_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weightI8[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.25.attn_v.weightQ4_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weightI8[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.26.attn_v.weightQ4_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weightI8[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.27.attn_v.weightQ4_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weightI8[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.28.attn_v.weightQ4_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weightI8[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.29.attn_v.weightQ4_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weightI8[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.30.attn_v.weightQ4_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weightI8[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.31.attn_v.weightQ4_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weightI8[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.32.attn_v.weightQ4_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weightI8[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.33.attn_v.weightQ4_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weightI8[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.34.attn_v.weightQ4_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weightI8[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.35.attn_v.weightQ4_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weightI8[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.36.attn_v.weightQ4_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weightI8[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.37.attn_v.weightQ4_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weightI8[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.38.attn_v.weightQ4_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weightI8[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.39.attn_v.weightQ4_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weightI8[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.40.attn_v.weightQ4_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weightI8[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.41.attn_v.weightQ4_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weightI8[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.42.attn_v.weightQ4_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weightI8[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.43.attn_v.weightQ4_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weightI8[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.44.attn_v.weightQ4_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weightI8[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.45.attn_v.weightQ4_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weightI8[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.46.attn_v.weightQ4_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weightI8[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.47.attn_v.weightQ4_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weightI8[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.48.attn_v.weightQ4_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weightI8[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.49.attn_v.weightQ4_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weightI8[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.50.attn_v.weightQ4_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weightI8[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.51.attn_v.weightQ4_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weightI8[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.52.attn_v.weightQ4_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weightI8[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.53.attn_v.weightQ4_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weightI8[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.54.attn_v.weightQ4_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weightI8[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.55.attn_v.weightQ4_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weightI8[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.56.attn_v.weightQ4_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weightI8[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.57.attn_v.weightQ4_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weightI8[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.58.attn_v.weightQ4_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weightI8[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.59.attn_v.weightQ4_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weightI8[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.60.attn_v.weightQ4_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weightI8[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.61.attn_v.weightQ4_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weightI8[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.62.attn_v.weightQ4_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weightI8[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.63.attn_v.weightQ4_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weightI8[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.64.attn_v.weightQ4_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weightI8[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.65.attn_v.weightQ4_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weightI8[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.66.attn_v.weightQ4_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weightI8[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.67.attn_v.weightQ4_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weightI8[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.68.attn_v.weightQ4_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weightI8[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.69.attn_v.weightQ4_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weightI8[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.70.attn_v.weightQ4_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weightI8[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.71.attn_v.weightQ4_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weightI8[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.72.attn_v.weightQ4_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weightI8[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.73.attn_v.weightQ4_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weightI8[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.74.attn_v.weightQ4_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weightI8[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.75.attn_v.weightQ4_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weightI8[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.76.attn_v.weightQ4_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weightI8[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.77.attn_v.weightQ4_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weightI8[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.78.attn_v.weightQ4_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weightI8[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.79.attn_v.weightQ4_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
output.weightQ5_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79