I-quants for meta-llama-3.1-70b-instruct
tools
71 Pulls Updated 8 weeks ago
043b594eeff2 · 24GB
-
general.architecturellama
-
general.basenamemeta-llama_Meta-Llama-3.1
-
general.file_type29
-
general.finetuneInstruct
-
general.languages[en, de, fr, it, pt, ...]
-
general.licensellama3.1
-
general.nameMeta llama_Meta Llama 3.1 70B Instruct
-
general.quantization_version2
-
general.size_label70B
-
general.tags[facebook, meta, pytorch, llama, llama-3, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count125
-
quantize.imatrix.datasetmisc/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.filegguf/Meta-Llama-3.1-70B-Instruct/imatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.0.attn_v.weightQ4_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.1.attn_v.weightQ4_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.2.attn_v.weightQ4_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.3.attn_v.weightQ4_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.4.attn_v.weightQ4_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.5.attn_v.weightQ4_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.6.attn_v.weightQ4_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.7.attn_v.weightQ4_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.8.attn_v.weightQ4_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.9.attn_v.weightQ4_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 21!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.10.attn_v.weightQ4_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.11.attn_v.weightQ4_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.12.attn_v.weightQ4_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.13.attn_v.weightQ4_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.14.attn_v.weightQ4_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.15.attn_v.weightQ4_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.16.attn_v.weightQ4_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.17.attn_v.weightQ4_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.18.attn_v.weightQ4_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.19.attn_v.weightQ4_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.20.attn_v.weightQ4_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.21.attn_v.weightQ4_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.22.attn_v.weightQ4_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.23.attn_v.weightQ4_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.24.attn_v.weightQ4_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.25.attn_v.weightQ4_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.26.attn_v.weightQ4_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.27.attn_v.weightQ4_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.28.attn_v.weightQ4_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.29.attn_v.weightQ4_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.30.attn_v.weightQ4_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.31.attn_v.weightQ4_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.32.attn_v.weightQ4_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.33.attn_v.weightQ4_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.34.attn_v.weightQ4_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.35.attn_v.weightQ4_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.36.attn_v.weightQ4_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.37.attn_v.weightQ4_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.38.attn_v.weightQ4_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.39.attn_v.weightQ4_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.40.attn_v.weightQ4_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.41.attn_v.weightQ4_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.42.attn_v.weightQ4_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.43.attn_v.weightQ4_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.44.attn_v.weightQ4_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.45.attn_v.weightQ4_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.46.attn_v.weightQ4_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.47.attn_v.weightQ4_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.48.attn_v.weightQ4_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.49.attn_v.weightQ4_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.50.attn_v.weightQ4_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.51.attn_v.weightQ4_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.52.attn_v.weightQ4_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.53.attn_v.weightQ4_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.54.attn_v.weightQ4_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.55.attn_v.weightQ4_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.56.attn_v.weightQ4_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.57.attn_v.weightQ4_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.58.attn_v.weightQ4_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.59.attn_v.weightQ4_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.60.attn_v.weightQ4_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.61.attn_v.weightQ4_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.62.attn_v.weightQ4_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.63.attn_v.weightQ4_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.64.attn_v.weightQ4_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.65.attn_v.weightQ4_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.66.attn_v.weightQ4_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.67.attn_v.weightQ4_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.68.attn_v.weightQ4_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.69.attn_v.weightQ4_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.70.attn_v.weightQ4_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.71.attn_v.weightQ4_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.72.attn_v.weightQ4_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.73.attn_v.weightQ4_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.74.attn_v.weightQ4_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.75.attn_v.weightQ4_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.76.attn_v.weightQ4_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.77.attn_v.weightQ4_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.78.attn_v.weightQ4_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 22!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 21!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 22!)[8192, 8192]
-
blk.79.attn_v.weightQ4_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 22!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 22!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 22!)[8192, 28672]
-
output.weightQ5_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79