I-quants for meta-llama-3.1-70b-instruct
tools
72 Pulls Updated 8 weeks ago
126545ee368e · 29GB
-
general.architecturellama
-
general.basenamemeta-llama_Meta-Llama-3.1
-
general.file_type22
-
general.finetuneInstruct
-
general.languages[en, de, fr, it, pt, ...]
-
general.licensellama3.1
-
general.nameMeta llama_Meta Llama 3.1 70B Instruct
-
general.quantization_version2
-
general.size_label70B
-
general.tags[facebook, meta, pytorch, llama, llama-3, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count125
-
quantize.imatrix.datasetmisc/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.filegguf/Meta-Llama-3.1-70B-Instruct/imatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[8192, 128256]
-
blk.0.attn_k.weightI32[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_q.weightI32[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.1.attn_k.weightI32[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_q.weightI32[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.2.attn_k.weightI32[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_q.weightI32[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.3.attn_k.weightI32[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_q.weightI32[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.4.attn_k.weightI32[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_q.weightI32[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.5.attn_k.weightI32[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_q.weightI32[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.6.attn_k.weightI32[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_q.weightI32[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.7.attn_k.weightI32[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_q.weightI32[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.8.attn_k.weightI32[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_q.weightI32[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.9.attn_k.weightI32[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_q.weightI32[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.10.attn_k.weightI32[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_q.weightI32[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.10.ffn_gate.weightI32[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weightI32[8192, 28672]
-
blk.11.attn_k.weightI32[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_q.weightI32[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.11.ffn_gate.weightI32[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weightI32[8192, 28672]
-
blk.12.attn_k.weightI32[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_q.weightI32[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.12.ffn_gate.weightI32[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weightI32[8192, 28672]
-
blk.13.attn_k.weightI32[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_q.weightI32[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.13.ffn_gate.weightI32[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weightI32[8192, 28672]
-
blk.14.attn_k.weightI32[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_q.weightI32[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.14.ffn_gate.weightI32[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weightI32[8192, 28672]
-
blk.15.attn_k.weightI32[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_q.weightI32[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.15.ffn_gate.weightI32[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weightI32[8192, 28672]
-
blk.16.attn_k.weightI32[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_q.weightI32[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.16.ffn_gate.weightI32[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weightI32[8192, 28672]
-
blk.17.attn_k.weightI32[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_q.weightI32[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.17.ffn_gate.weightI32[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weightI32[8192, 28672]
-
blk.18.attn_k.weightI32[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_q.weightI32[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.18.ffn_gate.weightI32[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weightI32[8192, 28672]
-
blk.19.attn_k.weightI32[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_q.weightI32[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.19.ffn_gate.weightI32[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weightI32[8192, 28672]
-
blk.20.attn_k.weightI32[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_q.weightI32[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.20.ffn_gate.weightI32[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weightI32[8192, 28672]
-
blk.21.attn_k.weightI32[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_q.weightI32[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.21.ffn_gate.weightI32[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weightI32[8192, 28672]
-
blk.22.attn_k.weightI32[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_q.weightI32[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.22.ffn_gate.weightI32[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weightI32[8192, 28672]
-
blk.23.attn_k.weightI32[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_q.weightI32[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.23.ffn_gate.weightI32[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weightI32[8192, 28672]
-
blk.24.attn_k.weightI32[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_q.weightI32[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.24.ffn_gate.weightI32[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weightI32[8192, 28672]
-
blk.25.attn_k.weightI32[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_q.weightI32[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.25.ffn_gate.weightI32[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weightI32[8192, 28672]
-
blk.26.attn_k.weightI32[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_q.weightI32[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.26.ffn_gate.weightI32[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weightI32[8192, 28672]
-
blk.27.attn_k.weightI32[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_q.weightI32[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.27.ffn_gate.weightI32[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weightI32[8192, 28672]
-
blk.28.attn_k.weightI32[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_q.weightI32[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.28.ffn_gate.weightI32[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weightI32[8192, 28672]
-
blk.29.attn_k.weightI32[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_q.weightI32[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.29.ffn_gate.weightI32[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weightI32[8192, 28672]
-
blk.30.attn_k.weightI32[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_q.weightI32[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.30.ffn_gate.weightI32[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weightI32[8192, 28672]
-
blk.31.attn_k.weightI32[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_q.weightI32[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.31.ffn_gate.weightI32[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weightI32[8192, 28672]
-
blk.32.attn_k.weightI32[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_q.weightI32[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.32.ffn_gate.weightI32[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weightI32[8192, 28672]
-
blk.33.attn_k.weightI32[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_q.weightI32[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.33.ffn_gate.weightI32[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weightI32[8192, 28672]
-
blk.34.attn_k.weightI32[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_q.weightI32[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.34.ffn_gate.weightI32[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weightI32[8192, 28672]
-
blk.35.attn_k.weightI32[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_q.weightI32[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.35.ffn_gate.weightI32[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weightI32[8192, 28672]
-
blk.36.attn_k.weightI32[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_q.weightI32[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.36.ffn_gate.weightI32[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weightI32[8192, 28672]
-
blk.37.attn_k.weightI32[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_q.weightI32[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.37.ffn_gate.weightI32[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weightI32[8192, 28672]
-
blk.38.attn_k.weightI32[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_q.weightI32[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.38.ffn_gate.weightI32[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weightI32[8192, 28672]
-
blk.39.attn_k.weightI32[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_q.weightI32[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.39.ffn_gate.weightI32[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weightI32[8192, 28672]
-
blk.40.attn_k.weightI32[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_q.weightI32[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.40.ffn_gate.weightI32[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weightI32[8192, 28672]
-
blk.41.attn_k.weightI32[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_q.weightI32[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.41.ffn_gate.weightI32[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weightI32[8192, 28672]
-
blk.42.attn_k.weightI32[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_q.weightI32[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.42.ffn_gate.weightI32[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weightI32[8192, 28672]
-
blk.43.attn_k.weightI32[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_q.weightI32[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.43.ffn_gate.weightI32[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weightI32[8192, 28672]
-
blk.44.attn_k.weightI32[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_q.weightI32[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.44.ffn_gate.weightI32[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weightI32[8192, 28672]
-
blk.45.attn_k.weightI32[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_q.weightI32[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.45.ffn_gate.weightI32[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weightI32[8192, 28672]
-
blk.46.attn_k.weightI32[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_q.weightI32[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.46.ffn_gate.weightI32[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weightI32[8192, 28672]
-
blk.47.attn_k.weightI32[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_q.weightI32[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.47.ffn_gate.weightI32[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weightI32[8192, 28672]
-
blk.48.attn_k.weightI32[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_q.weightI32[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.48.ffn_gate.weightI32[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weightI32[8192, 28672]
-
blk.49.attn_k.weightI32[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_q.weightI32[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.49.ffn_gate.weightI32[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weightI32[8192, 28672]
-
blk.50.attn_k.weightI32[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_q.weightI32[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.50.ffn_gate.weightI32[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weightI32[8192, 28672]
-
blk.51.attn_k.weightI32[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_q.weightI32[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.51.ffn_gate.weightI32[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weightI32[8192, 28672]
-
blk.52.attn_k.weightI32[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_q.weightI32[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.52.ffn_gate.weightI32[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weightI32[8192, 28672]
-
blk.53.attn_k.weightI32[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_q.weightI32[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.53.ffn_gate.weightI32[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weightI32[8192, 28672]
-
blk.54.attn_k.weightI32[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_q.weightI32[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.54.ffn_gate.weightI32[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weightI32[8192, 28672]
-
blk.55.attn_k.weightI32[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_q.weightI32[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.55.ffn_gate.weightI32[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weightI32[8192, 28672]
-
blk.56.attn_k.weightI32[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_q.weightI32[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.56.ffn_gate.weightI32[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weightI32[8192, 28672]
-
blk.57.attn_k.weightI32[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_q.weightI32[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.57.ffn_gate.weightI32[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weightI32[8192, 28672]
-
blk.58.attn_k.weightI32[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_q.weightI32[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.58.ffn_gate.weightI32[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weightI32[8192, 28672]
-
blk.59.attn_k.weightI32[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_q.weightI32[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.59.ffn_gate.weightI32[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weightI32[8192, 28672]
-
blk.60.attn_k.weightI32[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_q.weightI32[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.60.ffn_gate.weightI32[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weightI32[8192, 28672]
-
blk.61.attn_k.weightI32[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_q.weightI32[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.61.ffn_gate.weightI32[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weightI32[8192, 28672]
-
blk.62.attn_k.weightI32[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_q.weightI32[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.62.ffn_gate.weightI32[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weightI32[8192, 28672]
-
blk.63.attn_k.weightI32[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_q.weightI32[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.63.ffn_gate.weightI32[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weightI32[8192, 28672]
-
blk.64.attn_k.weightI32[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_q.weightI32[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.64.ffn_gate.weightI32[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weightI32[8192, 28672]
-
blk.65.attn_k.weightI32[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_q.weightI32[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.65.ffn_gate.weightI32[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weightI32[8192, 28672]
-
blk.66.attn_k.weightI32[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_q.weightI32[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.66.ffn_gate.weightI32[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weightI32[8192, 28672]
-
blk.67.attn_k.weightI32[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_q.weightI32[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.67.ffn_gate.weightI32[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weightI32[8192, 28672]
-
blk.68.attn_k.weightI32[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_q.weightI32[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.68.ffn_gate.weightI32[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weightI32[8192, 28672]
-
blk.69.attn_k.weightI32[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_q.weightI32[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.69.ffn_gate.weightI32[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weightI32[8192, 28672]
-
blk.70.attn_k.weightI32[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_q.weightI32[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.71.attn_k.weightI32[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_q.weightI32[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.72.attn_k.weightI32[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_q.weightI32[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.73.attn_k.weightI32[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_q.weightI32[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.74.attn_k.weightI32[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_q.weightI32[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.75.attn_k.weightI32[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_q.weightI32[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.76.attn_k.weightI32[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_q.weightI32[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.77.attn_k.weightI32[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_q.weightI32[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.78.attn_k.weightI32[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_q.weightI32[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
blk.79.attn_k.weightI32[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_q.weightI32[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 21!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 21!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79