New state-of-the-art model from Meta available in 8B, 70B and 405B sizes
tools
168 Pulls Updated 3 months ago
1e21397096b5 · 40GB
-
general.architecturellama
-
general.file_type25
-
general.finetune..
-
general.languages[en, de, fr, it, pt, ...]
-
general.licensellama3.1
-
general.name..
-
general.quantization_version2
-
general.size_label71B
-
general.tags[facebook, meta, pytorch, llama, llama-3, ...]
-
general.typemodel
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count62
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 20!)[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.0.attn_v.weightQ5_K[8192, 1024]
-
blk.0.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.1.attn_v.weightQ5_K[8192, 1024]
-
blk.1.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.2.attn_v.weightQ5_K[8192, 1024]
-
blk.2.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.3.attn_v.weightQ5_K[8192, 1024]
-
blk.3.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.4.attn_v.weightQ5_K[8192, 1024]
-
blk.4.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.5.attn_v.weightQ5_K[8192, 1024]
-
blk.5.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.6.attn_v.weightQ5_K[8192, 1024]
-
blk.6.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.7.attn_v.weightQ5_K[8192, 1024]
-
blk.7.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.8.attn_v.weightQ5_K[8192, 1024]
-
blk.8.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.9.attn_v.weightQ5_K[8192, 1024]
-
blk.9.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.10.attn_v.weightQ5_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.11.attn_v.weightQ5_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.12.attn_v.weightQ5_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.13.attn_v.weightQ5_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.14.attn_v.weightQ5_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.15.attn_v.weightQ5_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.16.attn_v.weightQ5_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.17.attn_v.weightQ5_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.18.attn_v.weightQ5_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.19.attn_v.weightQ5_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.20.attn_v.weightQ5_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.21.attn_v.weightQ5_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.22.attn_v.weightQ5_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.23.attn_v.weightQ5_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.24.attn_v.weightQ5_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.25.attn_v.weightQ5_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.26.attn_v.weightQ5_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.27.attn_v.weightQ5_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.28.attn_v.weightQ5_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.29.attn_v.weightQ5_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.30.attn_v.weightQ5_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.31.attn_v.weightQ5_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.32.attn_v.weightQ5_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.33.attn_v.weightQ5_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.34.attn_v.weightQ5_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.35.attn_v.weightQ5_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.36.attn_v.weightQ5_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.37.attn_v.weightQ5_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.38.attn_v.weightQ5_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.39.attn_v.weightQ5_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.40.attn_v.weightQ5_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.41.attn_v.weightQ5_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.42.attn_v.weightQ5_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.43.attn_v.weightQ5_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.44.attn_v.weightQ5_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.45.attn_v.weightQ5_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.46.attn_v.weightQ5_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.47.attn_v.weightQ5_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.48.attn_v.weightQ5_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.49.attn_v.weightQ5_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.50.attn_v.weightQ5_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.51.attn_v.weightQ5_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.52.attn_v.weightQ5_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.53.attn_v.weightQ5_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.54.attn_v.weightQ5_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.55.attn_v.weightQ5_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.56.attn_v.weightQ5_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.57.attn_v.weightQ5_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.58.attn_v.weightQ5_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.59.attn_v.weightQ5_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.60.attn_v.weightQ5_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.61.attn_v.weightQ5_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.62.attn_v.weightQ5_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.63.attn_v.weightQ5_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.64.attn_v.weightQ5_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.65.attn_v.weightQ5_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.66.attn_v.weightQ5_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.67.attn_v.weightQ5_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.68.attn_v.weightQ5_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.69.attn_v.weightQ5_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.70.attn_v.weightQ5_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.71.attn_v.weightQ5_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.72.attn_v.weightQ5_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.73.attn_v.weightQ5_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.74.attn_v.weightQ5_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.75.attn_v.weightQ5_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.76.attn_v.weightQ5_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.77.attn_v.weightQ5_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.78.attn_v.weightQ5_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 20!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 20!)[8192, 8192]
-
blk.79.attn_v.weightQ5_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 20!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 20!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 20!)[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
rope_freqs.weightF32[64]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79