Hermes 3 Llama-3.1 70b Model by NousResearch
tools
105 Pulls Updated 2 months ago
c309e5635bee · 40GB
-
general.architecturellama
-
general.base_model.0.nameMeta Llama 3.1 70B
-
general.base_model.0.organizationMeta Llama
-
general.base_model.0.repo_urlhttps://huggingface.co/meta-llama/Meta-Llama-3.1-70B
-
general.base_model.count1
-
general.file_type25
-
general.finetune..
-
general.languages[en]
-
general.licensellama3
-
general.name..
-
general.quantization_version2
-
general.size_label71B
-
general.tags[Llama-3, instruct, finetune, chatml, gpt4, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count124
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128039
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id128001
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 20!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79