LLM customized by NVIDIA to improve the helpfulness of generated responses. It ranks #1 on all three automatic alignment benchmarks (verified tab for AlpacaEval 2 LC), edging out strong frontier models such as GPT-4o and Claude 3.5 Sonnet.
70B
38 Pulls Updated 2 hours ago
cddf348aa7dc · 21GB
-
quantize.imatrix.chunks_count125
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file/models_out/Llama-3.1-Nemotron-70B-Instruct-HF-GGUF/Llama-3.1-Nemotron-70B-Instruct-HF.imatrix
-
general.architecturellama
-
general.file_typeIQ2_XS
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ Ġ ĠĠĠ ĠĠ ĠĠ ĠĠĠ Ġ i n ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ2_K[8192 128256]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ2_K[28672 8192]
-
blk.0.ffn_gate.weightI16[8192 28672]
-
blk.0.ffn_up.weightI16[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightI16[8192 1024]
-
blk.0.attn_output.weightI16[8192 8192]
-
blk.0.attn_q.weightI16[8192 8192]
-
blk.0.attn_v.weightQ4_K[8192 1024]
-
blk.1.ffn_gate.weightI16[8192 28672]
-
blk.1.attn_k.weightI16[8192 1024]
-
blk.1.attn_output.weightI16[8192 8192]
-
blk.1.attn_q.weightI16[8192 8192]
-
blk.1.attn_v.weightQ4_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ2_K[28672 8192]
-
blk.1.ffn_up.weightI16[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ2_K[28672 8192]
-
blk.2.ffn_gate.weightI16[8192 28672]
-
blk.2.ffn_up.weightI16[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightI16[8192 1024]
-
blk.2.attn_output.weightI16[8192 8192]
-
blk.2.attn_q.weightI16[8192 8192]
-
blk.2.attn_v.weightQ4_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ2_K[28672 8192]
-
blk.3.ffn_gate.weightI16[8192 28672]
-
blk.3.ffn_up.weightI16[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightI16[8192 1024]
-
blk.3.attn_output.weightI16[8192 8192]
-
blk.3.attn_q.weightI16[8192 8192]
-
blk.3.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_k.weightI16[8192 1024]
-
blk.4.attn_output.weightI16[8192 8192]
-
blk.4.attn_q.weightI16[8192 8192]
-
blk.4.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ2_K[28672 8192]
-
blk.4.ffn_gate.weightI16[8192 28672]
-
blk.4.ffn_up.weightI16[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ2_K[28672 8192]
-
blk.5.ffn_gate.weightI16[8192 28672]
-
blk.5.ffn_up.weightI16[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.weightI16[8192 1024]
-
blk.5.attn_output.weightI16[8192 8192]
-
blk.5.attn_q.weightI16[8192 8192]
-
blk.5.attn_v.weightQ4_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ2_K[28672 8192]
-
blk.6.ffn_gate.weightI16[8192 28672]
-
blk.6.ffn_up.weightI16[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightI16[8192 1024]
-
blk.6.attn_output.weightI16[8192 8192]
-
blk.6.attn_q.weightI16[8192 8192]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_k.weightI16[8192 1024]
-
blk.7.attn_q.weightI16[8192 8192]
-
blk.7.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ2_K[28672 8192]
-
blk.7.ffn_gate.weightI16[8192 28672]
-
blk.7.ffn_up.weightI16[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_output.weightI16[8192 8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ2_K[28672 8192]
-
blk.8.ffn_gate.weightI16[8192 28672]
-
blk.8.ffn_up.weightI16[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightI16[8192 1024]
-
blk.8.attn_output.weightI16[8192 8192]
-
blk.8.attn_q.weightI16[8192 8192]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ2_K[28672 8192]
-
blk.9.ffn_gate.weightI16[8192 28672]
-
blk.9.ffn_up.weightI16[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightI16[8192 1024]
-
blk.9.attn_output.weightI16[8192 8192]
-
blk.9.attn_q.weightI16[8192 8192]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightI16[28672 8192]
-
blk.10.ffn_gate.weightI16[8192 28672]
-
blk.10.ffn_up.weightI16[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightI16[8192 1024]
-
blk.10.attn_output.weightI16[8192 8192]
-
blk.10.attn_q.weightI16[8192 8192]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightI16[28672 8192]
-
blk.11.ffn_gate.weightI16[8192 28672]
-
blk.11.ffn_up.weightI16[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightI16[8192 1024]
-
blk.11.attn_output.weightI16[8192 8192]
-
blk.11.attn_q.weightI16[8192 8192]
-
blk.11.attn_v.weightQ4_K[8192 1024]
-
blk.12.ffn_gate.weightI16[8192 28672]
-
blk.12.ffn_up.weightI16[8192 28672]
-
blk.12.attn_k.weightI16[8192 1024]
-
blk.12.attn_output.weightI16[8192 8192]
-
blk.12.attn_q.weightI16[8192 8192]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightI16[28672 8192]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightI16[28672 8192]
-
blk.13.ffn_gate.weightI16[8192 28672]
-
blk.13.ffn_up.weightI16[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightI16[8192 1024]
-
blk.13.attn_output.weightI16[8192 8192]
-
blk.13.attn_q.weightI16[8192 8192]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightI16[28672 8192]
-
blk.14.ffn_gate.weightI16[8192 28672]
-
blk.14.ffn_up.weightI16[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightI16[8192 1024]
-
blk.14.attn_output.weightI16[8192 8192]
-
blk.14.attn_q.weightI16[8192 8192]
-
blk.14.attn_v.weightQ4_K[8192 1024]
-
blk.15.ffn_gate.weightI16[8192 28672]
-
blk.15.attn_k.weightI16[8192 1024]
-
blk.15.attn_output.weightI16[8192 8192]
-
blk.15.attn_q.weightI16[8192 8192]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightI16[28672 8192]
-
blk.15.ffn_up.weightI16[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightI16[28672 8192]
-
blk.16.ffn_gate.weightI16[8192 28672]
-
blk.16.ffn_up.weightI16[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightI16[8192 1024]
-
blk.16.attn_output.weightI16[8192 8192]
-
blk.16.attn_q.weightI16[8192 8192]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightI16[28672 8192]
-
blk.17.ffn_gate.weightI16[8192 28672]
-
blk.17.ffn_up.weightI16[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightI16[8192 1024]
-
blk.17.attn_output.weightI16[8192 8192]
-
blk.17.attn_q.weightI16[8192 8192]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_k.weightI16[8192 1024]
-
blk.18.attn_output.weightI16[8192 8192]
-
blk.18.attn_q.weightI16[8192 8192]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightI16[28672 8192]
-
blk.18.ffn_gate.weightI16[8192 28672]
-
blk.18.ffn_up.weightI16[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightI16[28672 8192]
-
blk.19.ffn_gate.weightI16[8192 28672]
-
blk.19.ffn_up.weightI16[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightI16[8192 1024]
-
blk.19.attn_output.weightI16[8192 8192]
-
blk.19.attn_q.weightI16[8192 8192]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightI16[28672 8192]
-
blk.20.ffn_gate.weightI16[8192 28672]
-
blk.20.ffn_up.weightI16[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightI16[8192 1024]
-
blk.20.attn_output.weightI16[8192 8192]
-
blk.20.attn_q.weightI16[8192 8192]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_k.weightI16[8192 1024]
-
blk.21.attn_q.weightI16[8192 8192]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightI16[28672 8192]
-
blk.21.ffn_gate.weightI16[8192 28672]
-
blk.21.ffn_up.weightI16[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_output.weightI16[8192 8192]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightI16[28672 8192]
-
blk.22.ffn_gate.weightI16[8192 28672]
-
blk.22.ffn_up.weightI16[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightI16[8192 1024]
-
blk.22.attn_output.weightI16[8192 8192]
-
blk.22.attn_q.weightI16[8192 8192]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightI16[28672 8192]
-
blk.23.ffn_gate.weightI16[8192 28672]
-
blk.23.ffn_up.weightI16[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightI16[8192 1024]
-
blk.23.attn_output.weightI16[8192 8192]
-
blk.23.attn_q.weightI16[8192 8192]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightI16[28672 8192]
-
blk.24.ffn_gate.weightI16[8192 28672]
-
blk.24.ffn_up.weightI16[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightI16[8192 1024]
-
blk.24.attn_output.weightI16[8192 8192]
-
blk.24.attn_q.weightI16[8192 8192]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightI16[28672 8192]
-
blk.25.ffn_gate.weightI16[8192 28672]
-
blk.25.ffn_up.weightI16[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightI16[8192 1024]
-
blk.25.attn_output.weightI16[8192 8192]
-
blk.25.attn_q.weightI16[8192 8192]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.26.ffn_gate.weightI16[8192 28672]
-
blk.26.ffn_up.weightI16[8192 28672]
-
blk.26.attn_k.weightI16[8192 1024]
-
blk.26.attn_output.weightI16[8192 8192]
-
blk.26.attn_q.weightI16[8192 8192]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightI16[28672 8192]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightI16[28672 8192]
-
blk.27.ffn_gate.weightI16[8192 28672]
-
blk.27.ffn_up.weightI16[8192 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.weightI16[8192 1024]
-
blk.27.attn_output.weightI16[8192 8192]
-
blk.27.attn_q.weightI16[8192 8192]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightI16[28672 8192]
-
blk.28.ffn_gate.weightI16[8192 28672]
-
blk.28.ffn_up.weightI16[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightI16[8192 1024]
-
blk.28.attn_output.weightI16[8192 8192]
-
blk.28.attn_q.weightI16[8192 8192]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.ffn_gate.weightI16[8192 28672]
-
blk.29.attn_k.weightI16[8192 1024]
-
blk.29.attn_output.weightI16[8192 8192]
-
blk.29.attn_q.weightI16[8192 8192]
-
blk.29.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightI16[28672 8192]
-
blk.29.ffn_up.weightI16[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightI16[28672 8192]
-
blk.30.ffn_gate.weightI16[8192 28672]
-
blk.30.ffn_up.weightI16[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightI16[8192 1024]
-
blk.30.attn_output.weightI16[8192 8192]
-
blk.30.attn_q.weightI16[8192 8192]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightI16[28672 8192]
-
blk.31.ffn_gate.weightI16[8192 28672]
-
blk.31.ffn_up.weightI16[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightI16[8192 1024]
-
blk.31.attn_output.weightI16[8192 8192]
-
blk.31.attn_q.weightI16[8192 8192]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_k.weightI16[8192 1024]
-
blk.32.attn_output.weightI16[8192 8192]
-
blk.32.attn_q.weightI16[8192 8192]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightI16[28672 8192]
-
blk.32.ffn_gate.weightI16[8192 28672]
-
blk.32.ffn_up.weightI16[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightI16[28672 8192]
-
blk.33.ffn_gate.weightI16[8192 28672]
-
blk.33.ffn_up.weightI16[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightI16[8192 1024]
-
blk.33.attn_output.weightI16[8192 8192]
-
blk.33.attn_q.weightI16[8192 8192]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightI16[28672 8192]
-
blk.34.ffn_gate.weightI16[8192 28672]
-
blk.34.ffn_up.weightI16[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightI16[8192 1024]
-
blk.34.attn_output.weightI16[8192 8192]
-
blk.34.attn_q.weightI16[8192 8192]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_k.weightI16[8192 1024]
-
blk.35.attn_q.weightI16[8192 8192]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightI16[28672 8192]
-
blk.35.ffn_gate.weightI16[8192 28672]
-
blk.35.ffn_up.weightI16[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_output.weightI16[8192 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightI16[28672 8192]
-
blk.36.ffn_gate.weightI16[8192 28672]
-
blk.36.ffn_up.weightI16[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightI16[8192 1024]
-
blk.36.attn_output.weightI16[8192 8192]
-
blk.36.attn_q.weightI16[8192 8192]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightI16[28672 8192]
-
blk.37.ffn_gate.weightI16[8192 28672]
-
blk.37.ffn_up.weightI16[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightI16[8192 1024]
-
blk.37.attn_output.weightI16[8192 8192]
-
blk.37.attn_q.weightI16[8192 8192]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightI16[28672 8192]
-
blk.38.ffn_gate.weightI16[8192 28672]
-
blk.38.ffn_up.weightI16[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightI16[8192 1024]
-
blk.38.attn_output.weightI16[8192 8192]
-
blk.38.attn_q.weightI16[8192 8192]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightI16[28672 8192]
-
blk.39.ffn_gate.weightI16[8192 28672]
-
blk.39.ffn_up.weightI16[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightI16[8192 1024]
-
blk.39.attn_output.weightI16[8192 8192]
-
blk.39.attn_q.weightI16[8192 8192]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.40.ffn_gate.weightI16[8192 28672]
-
blk.40.ffn_up.weightI16[8192 28672]
-
blk.40.attn_k.weightI16[8192 1024]
-
blk.40.attn_output.weightI16[8192 8192]
-
blk.40.attn_q.weightI16[8192 8192]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightI16[28672 8192]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightI16[28672 8192]
-
blk.41.ffn_gate.weightI16[8192 28672]
-
blk.41.ffn_up.weightI16[8192 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.weightI16[8192 1024]
-
blk.41.attn_output.weightI16[8192 8192]
-
blk.41.attn_q.weightI16[8192 8192]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightI16[28672 8192]
-
blk.42.ffn_gate.weightI16[8192 28672]
-
blk.42.ffn_up.weightI16[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightI16[8192 1024]
-
blk.42.attn_output.weightI16[8192 8192]
-
blk.42.attn_q.weightI16[8192 8192]
-
blk.42.attn_v.weightQ4_K[8192 1024]
-
blk.43.ffn_gate.weightI16[8192 28672]
-
blk.43.attn_k.weightI16[8192 1024]
-
blk.43.attn_output.weightI16[8192 8192]
-
blk.43.attn_q.weightI16[8192 8192]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightI16[28672 8192]
-
blk.43.ffn_up.weightI16[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightI16[28672 8192]
-
blk.44.ffn_gate.weightI16[8192 28672]
-
blk.44.ffn_up.weightI16[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightI16[8192 1024]
-
blk.44.attn_output.weightI16[8192 8192]
-
blk.44.attn_q.weightI16[8192 8192]
-
blk.44.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightI16[28672 8192]
-
blk.45.ffn_gate.weightI16[8192 28672]
-
blk.45.ffn_up.weightI16[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightI16[8192 1024]
-
blk.45.attn_output.weightI16[8192 8192]
-
blk.45.attn_q.weightI16[8192 8192]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_k.weightI16[8192 1024]
-
blk.46.attn_output.weightI16[8192 8192]
-
blk.46.attn_q.weightI16[8192 8192]
-
blk.46.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightI16[28672 8192]
-
blk.46.ffn_gate.weightI16[8192 28672]
-
blk.46.ffn_up.weightI16[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightI16[28672 8192]
-
blk.47.ffn_gate.weightI16[8192 28672]
-
blk.47.ffn_up.weightI16[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightI16[8192 1024]
-
blk.47.attn_output.weightI16[8192 8192]
-
blk.47.attn_q.weightI16[8192 8192]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightI16[28672 8192]
-
blk.48.ffn_gate.weightI16[8192 28672]
-
blk.48.ffn_up.weightI16[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightI16[8192 1024]
-
blk.48.attn_output.weightI16[8192 8192]
-
blk.48.attn_q.weightI16[8192 8192]
-
blk.48.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_k.weightI16[8192 1024]
-
blk.49.attn_q.weightI16[8192 8192]
-
blk.49.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightI16[28672 8192]
-
blk.49.ffn_gate.weightI16[8192 28672]
-
blk.49.ffn_up.weightI16[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_output.weightI16[8192 8192]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightI16[28672 8192]
-
blk.50.ffn_gate.weightI16[8192 28672]
-
blk.50.ffn_up.weightI16[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_k.weightI16[8192 1024]
-
blk.50.attn_output.weightI16[8192 8192]
-
blk.50.attn_q.weightI16[8192 8192]
-
blk.50.attn_v.weightQ4_K[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightI16[28672 8192]
-
blk.51.ffn_gate.weightI16[8192 28672]
-
blk.51.ffn_up.weightI16[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightI16[8192 1024]
-
blk.51.attn_output.weightI16[8192 8192]
-
blk.51.attn_q.weightI16[8192 8192]
-
blk.51.attn_v.weightQ4_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightI16[28672 8192]
-
blk.52.ffn_gate.weightI16[8192 28672]
-
blk.52.ffn_up.weightI16[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightI16[8192 1024]
-
blk.52.attn_output.weightI16[8192 8192]
-
blk.52.attn_q.weightI16[8192 8192]
-
blk.52.attn_v.weightQ4_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightI16[28672 8192]
-
blk.53.ffn_gate.weightI16[8192 28672]
-
blk.53.ffn_up.weightI16[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightI16[8192 1024]
-
blk.53.attn_output.weightI16[8192 8192]
-
blk.53.attn_q.weightI16[8192 8192]
-
blk.53.attn_v.weightQ4_K[8192 1024]
-
blk.54.ffn_gate.weightI16[8192 28672]
-
blk.54.ffn_up.weightI16[8192 28672]
-
blk.54.attn_k.weightI16[8192 1024]
-
blk.54.attn_output.weightI16[8192 8192]
-
blk.54.attn_q.weightI16[8192 8192]
-
blk.54.attn_v.weightQ4_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightI16[28672 8192]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightI16[28672 8192]
-
blk.55.ffn_gate.weightI16[8192 28672]
-
blk.55.ffn_up.weightI16[8192 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.weightI16[8192 1024]
-
blk.55.attn_output.weightI16[8192 8192]
-
blk.55.attn_q.weightI16[8192 8192]
-
blk.55.attn_v.weightQ4_K[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightI16[28672 8192]
-
blk.56.ffn_gate.weightI16[8192 28672]
-
blk.56.ffn_up.weightI16[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightI16[8192 1024]
-
blk.56.attn_output.weightI16[8192 8192]
-
blk.56.attn_q.weightI16[8192 8192]
-
blk.56.attn_v.weightQ4_K[8192 1024]
-
blk.57.ffn_gate.weightI16[8192 28672]
-
blk.57.attn_k.weightI16[8192 1024]
-
blk.57.attn_output.weightI16[8192 8192]
-
blk.57.attn_q.weightI16[8192 8192]
-
blk.57.attn_v.weightQ4_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightI16[28672 8192]
-
blk.57.ffn_up.weightI16[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightI16[28672 8192]
-
blk.58.ffn_gate.weightI16[8192 28672]
-
blk.58.ffn_up.weightI16[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.weightI16[8192 1024]
-
blk.58.attn_output.weightI16[8192 8192]
-
blk.58.attn_q.weightI16[8192 8192]
-
blk.58.attn_v.weightQ4_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightI16[28672 8192]
-
blk.59.ffn_gate.weightI16[8192 28672]
-
blk.59.ffn_up.weightI16[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightI16[8192 1024]
-
blk.59.attn_output.weightI16[8192 8192]
-
blk.59.attn_q.weightI16[8192 8192]
-
blk.59.attn_v.weightQ4_K[8192 1024]
-
blk.60.attn_k.weightI16[8192 1024]
-
blk.60.attn_output.weightI16[8192 8192]
-
blk.60.attn_q.weightI16[8192 8192]
-
blk.60.attn_v.weightQ4_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightI16[28672 8192]
-
blk.60.ffn_gate.weightI16[8192 28672]
-
blk.60.ffn_up.weightI16[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightI16[28672 8192]
-
blk.61.ffn_gate.weightI16[8192 28672]
-
blk.61.ffn_up.weightI16[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_k.weightI16[8192 1024]
-
blk.61.attn_output.weightI16[8192 8192]
-
blk.61.attn_q.weightI16[8192 8192]
-
blk.61.attn_v.weightQ4_K[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightI16[28672 8192]
-
blk.62.ffn_gate.weightI16[8192 28672]
-
blk.62.ffn_up.weightI16[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightI16[8192 1024]
-
blk.62.attn_output.weightI16[8192 8192]
-
blk.62.attn_q.weightI16[8192 8192]
-
blk.62.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_k.weightI16[8192 1024]
-
blk.63.attn_q.weightI16[8192 8192]
-
blk.63.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightI16[28672 8192]
-
blk.63.ffn_gate.weightI16[8192 28672]
-
blk.63.ffn_up.weightI16[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_output.weightI16[8192 8192]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightI16[28672 8192]
-
blk.64.ffn_gate.weightI16[8192 28672]
-
blk.64.ffn_up.weightI16[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.weightI16[8192 1024]
-
blk.64.attn_output.weightI16[8192 8192]
-
blk.64.attn_q.weightI16[8192 8192]
-
blk.64.attn_v.weightQ4_K[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightI16[28672 8192]
-
blk.65.ffn_gate.weightI16[8192 28672]
-
blk.65.ffn_up.weightI16[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightI16[8192 1024]
-
blk.65.attn_output.weightI16[8192 8192]
-
blk.65.attn_q.weightI16[8192 8192]
-
blk.65.attn_v.weightQ4_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightI16[28672 8192]
-
blk.66.ffn_gate.weightI16[8192 28672]
-
blk.66.ffn_up.weightI16[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightI16[8192 1024]
-
blk.66.attn_output.weightI16[8192 8192]
-
blk.66.attn_q.weightI16[8192 8192]
-
blk.66.attn_v.weightQ4_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightI16[28672 8192]
-
blk.67.ffn_gate.weightI16[8192 28672]
-
blk.67.ffn_up.weightI16[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightI16[8192 1024]
-
blk.67.attn_output.weightI16[8192 8192]
-
blk.67.attn_q.weightI16[8192 8192]
-
blk.67.attn_v.weightQ4_K[8192 1024]
-
blk.68.ffn_gate.weightI16[8192 28672]
-
blk.68.ffn_up.weightI16[8192 28672]
-
blk.68.attn_k.weightI16[8192 1024]
-
blk.68.attn_output.weightI16[8192 8192]
-
blk.68.attn_q.weightI16[8192 8192]
-
blk.68.attn_v.weightQ4_K[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightI16[28672 8192]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightI16[28672 8192]
-
blk.69.ffn_gate.weightI16[8192 28672]
-
blk.69.ffn_up.weightI16[8192 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.weightI16[8192 1024]
-
blk.69.attn_output.weightI16[8192 8192]
-
blk.69.attn_q.weightI16[8192 8192]
-
blk.69.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightI16[28672 8192]
-
blk.70.ffn_gate.weightI16[8192 28672]
-
blk.70.ffn_up.weightI16[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightI16[8192 1024]
-
blk.70.attn_output.weightI16[8192 8192]
-
blk.70.attn_q.weightI16[8192 8192]
-
blk.70.attn_v.weightQ4_K[8192 1024]
-
blk.71.ffn_gate.weightI16[8192 28672]
-
blk.71.attn_k.weightI16[8192 1024]
-
blk.71.attn_output.weightI16[8192 8192]
-
blk.71.attn_q.weightI16[8192 8192]
-
blk.71.attn_v.weightQ4_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightI16[28672 8192]
-
blk.71.ffn_up.weightI16[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightI16[28672 8192]
-
blk.72.ffn_gate.weightI16[8192 28672]
-
blk.72.ffn_up.weightI16[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.weightI16[8192 1024]
-
blk.72.attn_output.weightI16[8192 8192]
-
blk.72.attn_q.weightI16[8192 8192]
-
blk.72.attn_v.weightQ4_K[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightI16[28672 8192]
-
blk.73.ffn_gate.weightI16[8192 28672]
-
blk.73.ffn_up.weightI16[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightI16[8192 1024]
-
blk.73.attn_output.weightI16[8192 8192]
-
blk.73.attn_q.weightI16[8192 8192]
-
blk.73.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_k.weightI16[8192 1024]
-
blk.74.attn_output.weightI16[8192 8192]
-
blk.74.attn_q.weightI16[8192 8192]
-
blk.74.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightI16[28672 8192]
-
blk.74.ffn_gate.weightI16[8192 28672]
-
blk.74.ffn_up.weightI16[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightI16[28672 8192]
-
blk.75.ffn_gate.weightI16[8192 28672]
-
blk.75.ffn_up.weightI16[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.attn_k.weightI16[8192 1024]
-
blk.75.attn_output.weightI16[8192 8192]
-
blk.75.attn_q.weightI16[8192 8192]
-
blk.75.attn_v.weightQ4_K[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightI16[28672 8192]
-
blk.76.ffn_gate.weightI16[8192 28672]
-
blk.76.ffn_up.weightI16[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightI16[8192 1024]
-
blk.76.attn_output.weightI16[8192 8192]
-
blk.76.attn_q.weightI16[8192 8192]
-
blk.76.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_k.weightI16[8192 1024]
-
blk.77.attn_q.weightI16[8192 8192]
-
blk.77.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightI16[28672 8192]
-
blk.77.ffn_gate.weightI16[8192 28672]
-
blk.77.ffn_up.weightI16[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_output.weightI16[8192 8192]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightI16[28672 8192]
-
blk.78.ffn_gate.weightI16[8192 28672]
-
blk.78.ffn_up.weightI16[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_k.weightI16[8192 1024]
-
blk.78.attn_output.weightI16[8192 8192]
-
blk.78.attn_q.weightI16[8192 8192]
-
blk.78.attn_v.weightQ4_K[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightI16[28672 8192]
-
blk.79.ffn_gate.weightI16[8192 28672]
-
blk.79.ffn_up.weightI16[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightI16[8192 1024]
-
blk.79.attn_output.weightI16[8192 8192]
-
blk.79.attn_q.weightI16[8192 8192]
-
blk.79.attn_v.weightQ4_K[8192 1024]
-
output_norm.weightF32[8192]
-
output.weightQ5_K[8192 128256]
-
rope_freqs.weightF32[64]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79