iq2_xs quant
70B
62 Pulls Updated 7 weeks ago
7c9f39a2cd7c · 21GB
-
quantize.imatrix.chunks_count68
-
quantize.imatrix.datasetgroup_40.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file./Meta-Llama-3.1-70B-Instruct-GGUF_imatrix.dat
-
general.architecturellama
-
general.file_typeIQ2_XS
-
general.quantization_version2
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length131072
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ Ġ ĠĠĠ ĠĠ ĠĠ ĠĠĠ Ġ i n ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ2_K[8192 128256]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ2_K[28672 8192]
-
blk.0.ffn_gate.weightI16[8192 28672]
-
blk.0.ffn_up.weightI16[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightI16[8192 1024]
-
blk.0.attn_output.weightI16[8192 8192]
-
blk.0.attn_q.weightI16[8192 8192]
-
blk.0.attn_v.weightQ4_K[8192 1024]
-
blk.1.ffn_gate.weightI16[8192 28672]
-
blk.1.attn_k.weightI16[8192 1024]
-
blk.1.attn_output.weightI16[8192 8192]
-
blk.1.attn_q.weightI16[8192 8192]
-
blk.1.attn_v.weightQ4_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ2_K[28672 8192]
-
blk.1.ffn_up.weightI16[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ2_K[28672 8192]
-
blk.2.ffn_gate.weightI16[8192 28672]
-
blk.2.ffn_up.weightI16[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightI16[8192 1024]
-
blk.2.attn_output.weightI16[8192 8192]
-
blk.2.attn_q.weightI16[8192 8192]
-
blk.2.attn_v.weightQ4_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ2_K[28672 8192]
-
blk.3.ffn_gate.weightI16[8192 28672]
-
blk.3.ffn_up.weightI16[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightI16[8192 1024]
-
blk.3.attn_output.weightI16[8192 8192]
-
blk.3.attn_q.weightI16[8192 8192]
-
blk.3.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_k.weightI16[8192 1024]
-
blk.4.attn_output.weightI16[8192 8192]
-
blk.4.attn_q.weightI16[8192 8192]
-
blk.4.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ2_K[28672 8192]
-
blk.4.ffn_gate.weightI16[8192 28672]
-
blk.4.ffn_up.weightI16[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ2_K[28672 8192]
-
blk.5.ffn_gate.weightI16[8192 28672]
-
blk.5.ffn_up.weightI16[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.weightI16[8192 1024]
-
blk.5.attn_output.weightI16[8192 8192]
-
blk.5.attn_q.weightI16[8192 8192]
-
blk.5.attn_v.weightQ4_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ2_K[28672 8192]
-
blk.6.ffn_gate.weightI16[8192 28672]
-
blk.6.ffn_up.weightI16[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightI16[8192 1024]
-
blk.6.attn_output.weightI16[8192 8192]
-
blk.6.attn_q.weightI16[8192 8192]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_k.weightI16[8192 1024]
-
blk.7.attn_q.weightI16[8192 8192]
-
blk.7.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ2_K[28672 8192]
-
blk.7.ffn_gate.weightI16[8192 28672]
-
blk.7.ffn_up.weightI16[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_output.weightI16[8192 8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ2_K[28672 8192]
-
blk.8.ffn_gate.weightI16[8192 28672]
-
blk.8.ffn_up.weightI16[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightI16[8192 1024]
-
blk.8.attn_output.weightI16[8192 8192]
-
blk.8.attn_q.weightI16[8192 8192]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ2_K[28672 8192]
-
blk.9.ffn_gate.weightI16[8192 28672]
-
blk.9.ffn_up.weightI16[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightI16[8192 1024]
-
blk.9.attn_output.weightI16[8192 8192]
-
blk.9.attn_q.weightI16[8192 8192]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightI16[28672 8192]
-
blk.10.ffn_gate.weightI16[8192 28672]
-
blk.10.ffn_up.weightI16[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightI16[8192 1024]
-
blk.10.attn_output.weightI16[8192 8192]
-
blk.10.attn_q.weightI16[8192 8192]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightI16[28672 8192]
-
blk.11.ffn_gate.weightI16[8192 28672]
-
blk.11.ffn_up.weightI16[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightI16[8192 1024]
-
blk.11.attn_output.weightI16[8192 8192]
-
blk.11.attn_q.weightI16[8192 8192]
-
blk.11.attn_v.weightQ4_K[8192 1024]
-
blk.12.ffn_gate.weightI16[8192 28672]
-
blk.12.ffn_up.weightI16[8192 28672]
-
blk.12.attn_k.weightI16[8192 1024]
-
blk.12.attn_output.weightI16[8192 8192]
-
blk.12.attn_q.weightI16[8192 8192]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightI16[28672 8192]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightI16[28672 8192]
-
blk.13.ffn_gate.weightI16[8192 28672]
-
blk.13.ffn_up.weightI16[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightI16[8192 1024]
-
blk.13.attn_output.weightI16[8192 8192]
-
blk.13.attn_q.weightI16[8192 8192]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightI16[28672 8192]
-
blk.14.ffn_gate.weightI16[8192 28672]
-
blk.14.ffn_up.weightI16[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightI16[8192 1024]
-
blk.14.attn_output.weightI16[8192 8192]
-
blk.14.attn_q.weightI16[8192 8192]
-
blk.14.attn_v.weightQ4_K[8192 1024]
-
blk.15.ffn_gate.weightI16[8192 28672]
-
blk.15.attn_k.weightI16[8192 1024]
-
blk.15.attn_output.weightI16[8192 8192]
-
blk.15.attn_q.weightI16[8192 8192]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightI16[28672 8192]
-
blk.15.ffn_up.weightI16[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightI16[28672 8192]
-
blk.16.ffn_gate.weightI16[8192 28672]
-
blk.16.ffn_up.weightI16[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightI16[8192 1024]
-
blk.16.attn_output.weightI16[8192 8192]
-
blk.16.attn_q.weightI16[8192 8192]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightI16[28672 8192]
-
blk.17.ffn_gate.weightI16[8192 28672]
-
blk.17.ffn_up.weightI16[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightI16[8192 1024]
-
blk.17.attn_output.weightI16[8192 8192]
-
blk.17.attn_q.weightI16[8192 8192]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_k.weightI16[8192 1024]
-
blk.18.attn_output.weightI16[8192 8192]
-
blk.18.attn_q.weightI16[8192 8192]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightI16[28672 8192]
-
blk.18.ffn_gate.weightI16[8192 28672]
-
blk.18.ffn_up.weightI16[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightI16[28672 8192]
-
blk.19.ffn_gate.weightI16[8192 28672]
-
blk.19.ffn_up.weightI16[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightI16[8192 1024]
-
blk.19.attn_output.weightI16[8192 8192]
-
blk.19.attn_q.weightI16[8192 8192]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightI16[28672 8192]
-
blk.20.ffn_gate.weightI16[8192 28672]
-
blk.20.ffn_up.weightI16[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightI16[8192 1024]
-
blk.20.attn_output.weightI16[8192 8192]
-
blk.20.attn_q.weightI16[8192 8192]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_k.weightI16[8192 1024]
-
blk.21.attn_q.weightI16[8192 8192]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightI16[28672 8192]
-
blk.21.ffn_gate.weightI16[8192 28672]
-
blk.21.ffn_up.weightI16[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_output.weightI16[8192 8192]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightI16[28672 8192]
-
blk.22.ffn_gate.weightI16[8192 28672]
-
blk.22.ffn_up.weightI16[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightI16[8192 1024]
-
blk.22.attn_output.weightI16[8192 8192]
-
blk.22.attn_q.weightI16[8192 8192]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightI16[28672 8192]
-
blk.23.ffn_gate.weightI16[8192 28672]
-
blk.23.ffn_up.weightI16[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightI16[8192 1024]
-
blk.23.attn_output.weightI16[8192 8192]
-
blk.23.attn_q.weightI16[8192 8192]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightI16[28672 8192]
-
blk.24.ffn_gate.weightI16[8192 28672]
-
blk.24.ffn_up.weightI16[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightI16[8192 1024]
-
blk.24.attn_output.weightI16[8192 8192]
-
blk.24.attn_q.weightI16[8192 8192]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightI16[28672 8192]
-
blk.25.ffn_gate.weightI16[8192 28672]
-
blk.25.ffn_up.weightI16[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightI16[8192 1024]
-
blk.25.attn_output.weightI16[8192 8192]
-
blk.25.attn_q.weightI16[8192 8192]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.26.ffn_gate.weightI16[8192 28672]
-
blk.26.ffn_up.weightI16[8192 28672]
-
blk.26.attn_k.weightI16[8192 1024]
-
blk.26.attn_output.weightI16[8192 8192]
-
blk.26.attn_q.weightI16[8192 8192]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightI16[28672 8192]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightI16[28672 8192]
-
blk.27.ffn_gate.weightI16[8192 28672]
-
blk.27.ffn_up.weightI16[8192 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.weightI16[8192 1024]
-
blk.27.attn_output.weightI16[8192 8192]
-
blk.27.attn_q.weightI16[8192 8192]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightI16[28672 8192]
-
blk.28.ffn_gate.weightI16[8192 28672]
-
blk.28.ffn_up.weightI16[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightI16[8192 1024]
-
blk.28.attn_output.weightI16[8192 8192]
-
blk.28.attn_q.weightI16[8192 8192]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.ffn_gate.weightI16[8192 28672]
-
blk.29.attn_k.weightI16[8192 1024]
-
blk.29.attn_output.weightI16[8192 8192]
-
blk.29.attn_q.weightI16[8192 8192]
-
blk.29.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightI16[28672 8192]
-
blk.29.ffn_up.weightI16[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightI16[28672 8192]
-
blk.30.ffn_gate.weightI16[8192 28672]
-
blk.30.ffn_up.weightI16[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightI16[8192 1024]
-
blk.30.attn_output.weightI16[8192 8192]
-
blk.30.attn_q.weightI16[8192 8192]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightI16[28672 8192]
-
blk.31.ffn_gate.weightI16[8192 28672]
-
blk.31.ffn_up.weightI16[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightI16[8192 1024]
-
blk.31.attn_output.weightI16[8192 8192]
-
blk.31.attn_q.weightI16[8192 8192]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_k.weightI16[8192 1024]
-
blk.32.attn_output.weightI16[8192 8192]
-
blk.32.attn_q.weightI16[8192 8192]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightI16[28672 8192]
-
blk.32.ffn_gate.weightI16[8192 28672]
-
blk.32.ffn_up.weightI16[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightI16[28672 8192]
-
blk.33.ffn_gate.weightI16[8192 28672]
-
blk.33.ffn_up.weightI16[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightI16[8192 1024]
-
blk.33.attn_output.weightI16[8192 8192]
-
blk.33.attn_q.weightI16[8192 8192]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightI16[28672 8192]
-
blk.34.ffn_gate.weightI16[8192 28672]
-
blk.34.ffn_up.weightI16[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightI16[8192 1024]
-
blk.34.attn_output.weightI16[8192 8192]
-
blk.34.attn_q.weightI16[8192 8192]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_k.weightI16[8192 1024]
-
blk.35.attn_q.weightI16[8192 8192]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightI16[28672 8192]
-
blk.35.ffn_gate.weightI16[8192 28672]
-
blk.35.ffn_up.weightI16[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_output.weightI16[8192 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightI16[28672 8192]
-
blk.36.ffn_gate.weightI16[8192 28672]
-
blk.36.ffn_up.weightI16[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightI16[8192 1024]
-
blk.36.attn_output.weightI16[8192 8192]
-
blk.36.attn_q.weightI16[8192 8192]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightI16[28672 8192]
-
blk.37.ffn_gate.weightI16[8192 28672]
-
blk.37.ffn_up.weightI16[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightI16[8192 1024]
-
blk.37.attn_output.weightI16[8192 8192]
-
blk.37.attn_q.weightI16[8192 8192]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightI16[28672 8192]
-
blk.38.ffn_gate.weightI16[8192 28672]
-
blk.38.ffn_up.weightI16[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightI16[8192 1024]
-
blk.38.attn_output.weightI16[8192 8192]
-
blk.38.attn_q.weightI16[8192 8192]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightI16[28672 8192]
-
blk.39.ffn_gate.weightI16[8192 28672]
-
blk.39.ffn_up.weightI16[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightI16[8192 1024]
-
blk.39.attn_output.weightI16[8192 8192]
-
blk.39.attn_q.weightI16[8192 8192]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.40.ffn_gate.weightI16[8192 28672]
-
blk.40.ffn_up.weightI16[8192 28672]
-
blk.40.attn_k.weightI16[8192 1024]
-
blk.40.attn_output.weightI16[8192 8192]
-
blk.40.attn_q.weightI16[8192 8192]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightI16[28672 8192]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightI16[28672 8192]
-
blk.41.ffn_gate.weightI16[8192 28672]
-
blk.41.ffn_up.weightI16[8192 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.weightI16[8192 1024]
-
blk.41.attn_output.weightI16[8192 8192]
-
blk.41.attn_q.weightI16[8192 8192]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightI16[28672 8192]
-
blk.42.ffn_gate.weightI16[8192 28672]
-
blk.42.ffn_up.weightI16[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightI16[8192 1024]
-
blk.42.attn_output.weightI16[8192 8192]
-
blk.42.attn_q.weightI16[8192 8192]
-
blk.42.attn_v.weightQ4_K[8192 1024]
-
blk.43.ffn_gate.weightI16[8192 28672]
-
blk.43.attn_k.weightI16[8192 1024]
-
blk.43.attn_output.weightI16[8192 8192]
-
blk.43.attn_q.weightI16[8192 8192]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightI16[28672 8192]
-
blk.43.ffn_up.weightI16[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightI16[28672 8192]
-
blk.44.ffn_gate.weightI16[8192 28672]
-
blk.44.ffn_up.weightI16[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightI16[8192 1024]
-
blk.44.attn_output.weightI16[8192 8192]
-
blk.44.attn_q.weightI16[8192 8192]
-
blk.44.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightI16[28672 8192]
-
blk.45.ffn_gate.weightI16[8192 28672]
-
blk.45.ffn_up.weightI16[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightI16[8192 1024]
-
blk.45.attn_output.weightI16[8192 8192]
-
blk.45.attn_q.weightI16[8192 8192]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_k.weightI16[8192 1024]
-
blk.46.attn_output.weightI16[8192 8192]
-
blk.46.attn_q.weightI16[8192 8192]
-
blk.46.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightI16[28672 8192]
-
blk.46.ffn_gate.weightI16[8192 28672]
-
blk.46.ffn_up.weightI16[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightI16[28672 8192]
-
blk.47.ffn_gate.weightI16[8192 28672]
-
blk.47.ffn_up.weightI16[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightI16[8192 1024]
-
blk.47.attn_output.weightI16[8192 8192]
-
blk.47.attn_q.weightI16[8192 8192]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightI16[28672 8192]
-
blk.48.ffn_gate.weightI16[8192 28672]
-
blk.48.ffn_up.weightI16[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightI16[8192 1024]
-
blk.48.attn_output.weightI16[8192 8192]
-
blk.48.attn_q.weightI16[8192 8192]
-
blk.48.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_k.weightI16[8192 1024]
-
blk.49.attn_q.weightI16[8192 8192]
-
blk.49.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightI16[28672 8192]
-
blk.49.ffn_gate.weightI16[8192 28672]
-
blk.49.ffn_up.weightI16[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_output.weightI16[8192 8192]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightI16[28672 8192]
-
blk.50.ffn_gate.weightI16[8192 28672]
-
blk.50.ffn_up.weightI16[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_k.weightI16[8192 1024]
-
blk.50.attn_output.weightI16[8192 8192]
-
blk.50.attn_q.weightI16[8192 8192]
-
blk.50.attn_v.weightQ4_K[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightI16[28672 8192]
-
blk.51.ffn_gate.weightI16[8192 28672]
-
blk.51.ffn_up.weightI16[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightI16[8192 1024]
-
blk.51.attn_output.weightI16[8192 8192]
-
blk.51.attn_q.weightI16[8192 8192]
-
blk.51.attn_v.weightQ4_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightI16[28672 8192]
-
blk.52.ffn_gate.weightI16[8192 28672]
-
blk.52.ffn_up.weightI16[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightI16[8192 1024]
-
blk.52.attn_output.weightI16[8192 8192]
-
blk.52.attn_q.weightI16[8192 8192]
-
blk.52.attn_v.weightQ4_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightI16[28672 8192]
-
blk.53.ffn_gate.weightI16[8192 28672]
-
blk.53.ffn_up.weightI16[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightI16[8192 1024]
-
blk.53.attn_output.weightI16[8192 8192]
-
blk.53.attn_q.weightI16[8192 8192]
-
blk.53.attn_v.weightQ4_K[8192 1024]
-
blk.54.ffn_gate.weightI16[8192 28672]
-
blk.54.ffn_up.weightI16[8192 28672]
-
blk.54.attn_k.weightI16[8192 1024]
-
blk.54.attn_output.weightI16[8192 8192]
-
blk.54.attn_q.weightI16[8192 8192]
-
blk.54.attn_v.weightQ4_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightI16[28672 8192]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightI16[28672 8192]
-
blk.55.ffn_gate.weightI16[8192 28672]
-
blk.55.ffn_up.weightI16[8192 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.weightI16[8192 1024]
-
blk.55.attn_output.weightI16[8192 8192]
-
blk.55.attn_q.weightI16[8192 8192]
-
blk.55.attn_v.weightQ4_K[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightI16[28672 8192]
-
blk.56.ffn_gate.weightI16[8192 28672]
-
blk.56.ffn_up.weightI16[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightI16[8192 1024]
-
blk.56.attn_output.weightI16[8192 8192]
-
blk.56.attn_q.weightI16[8192 8192]
-
blk.56.attn_v.weightQ4_K[8192 1024]
-
blk.57.ffn_gate.weightI16[8192 28672]
-
blk.57.attn_k.weightI16[8192 1024]
-
blk.57.attn_output.weightI16[8192 8192]
-
blk.57.attn_q.weightI16[8192 8192]
-
blk.57.attn_v.weightQ4_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightI16[28672 8192]
-
blk.57.ffn_up.weightI16[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightI16[28672 8192]
-
blk.58.ffn_gate.weightI16[8192 28672]
-
blk.58.ffn_up.weightI16[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.weightI16[8192 1024]
-
blk.58.attn_output.weightI16[8192 8192]
-
blk.58.attn_q.weightI16[8192 8192]
-
blk.58.attn_v.weightQ4_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightI16[28672 8192]
-
blk.59.ffn_gate.weightI16[8192 28672]
-
blk.59.ffn_up.weightI16[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightI16[8192 1024]
-
blk.59.attn_output.weightI16[8192 8192]
-
blk.59.attn_q.weightI16[8192 8192]
-
blk.59.attn_v.weightQ4_K[8192 1024]
-
blk.60.attn_k.weightI16[8192 1024]
-
blk.60.attn_output.weightI16[8192 8192]
-
blk.60.attn_q.weightI16[8192 8192]
-
blk.60.attn_v.weightQ4_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightI16[28672 8192]
-
blk.60.ffn_gate.weightI16[8192 28672]
-
blk.60.ffn_up.weightI16[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightI16[28672 8192]
-
blk.61.ffn_gate.weightI16[8192 28672]
-
blk.61.ffn_up.weightI16[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_k.weightI16[8192 1024]
-
blk.61.attn_output.weightI16[8192 8192]
-
blk.61.attn_q.weightI16[8192 8192]
-
blk.61.attn_v.weightQ4_K[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightI16[28672 8192]
-
blk.62.ffn_gate.weightI16[8192 28672]
-
blk.62.ffn_up.weightI16[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightI16[8192 1024]
-
blk.62.attn_output.weightI16[8192 8192]
-
blk.62.attn_q.weightI16[8192 8192]
-
blk.62.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_k.weightI16[8192 1024]
-
blk.63.attn_q.weightI16[8192 8192]
-
blk.63.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightI16[28672 8192]
-
blk.63.ffn_gate.weightI16[8192 28672]
-
blk.63.ffn_up.weightI16[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_output.weightI16[8192 8192]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightI16[28672 8192]
-
blk.64.ffn_gate.weightI16[8192 28672]
-
blk.64.ffn_up.weightI16[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.weightI16[8192 1024]
-
blk.64.attn_output.weightI16[8192 8192]
-
blk.64.attn_q.weightI16[8192 8192]
-
blk.64.attn_v.weightQ4_K[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightI16[28672 8192]
-
blk.65.ffn_gate.weightI16[8192 28672]
-
blk.65.ffn_up.weightI16[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightI16[8192 1024]
-
blk.65.attn_output.weightI16[8192 8192]
-
blk.65.attn_q.weightI16[8192 8192]
-
blk.65.attn_v.weightQ4_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightI16[28672 8192]
-
blk.66.ffn_gate.weightI16[8192 28672]
-
blk.66.ffn_up.weightI16[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightI16[8192 1024]
-
blk.66.attn_output.weightI16[8192 8192]
-
blk.66.attn_q.weightI16[8192 8192]
-
blk.66.attn_v.weightQ4_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightI16[28672 8192]
-
blk.67.ffn_gate.weightI16[8192 28672]
-
blk.67.ffn_up.weightI16[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightI16[8192 1024]
-
blk.67.attn_output.weightI16[8192 8192]
-
blk.67.attn_q.weightI16[8192 8192]
-
blk.67.attn_v.weightQ4_K[8192 1024]
-
blk.68.ffn_gate.weightI16[8192 28672]
-
blk.68.ffn_up.weightI16[8192 28672]
-
blk.68.attn_k.weightI16[8192 1024]
-
blk.68.attn_output.weightI16[8192 8192]
-
blk.68.attn_q.weightI16[8192 8192]
-
blk.68.attn_v.weightQ4_K[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightI16[28672 8192]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightI16[28672 8192]
-
blk.69.ffn_gate.weightI16[8192 28672]
-
blk.69.ffn_up.weightI16[8192 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.weightI16[8192 1024]
-
blk.69.attn_output.weightI16[8192 8192]
-
blk.69.attn_q.weightI16[8192 8192]
-
blk.69.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightI16[28672 8192]
-
blk.70.ffn_gate.weightI16[8192 28672]
-
blk.70.ffn_up.weightI16[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightI16[8192 1024]
-
blk.70.attn_output.weightI16[8192 8192]
-
blk.70.attn_q.weightI16[8192 8192]
-
blk.70.attn_v.weightQ4_K[8192 1024]
-
blk.71.ffn_gate.weightI16[8192 28672]
-
blk.71.attn_k.weightI16[8192 1024]
-
blk.71.attn_output.weightI16[8192 8192]
-
blk.71.attn_q.weightI16[8192 8192]
-
blk.71.attn_v.weightQ4_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightI16[28672 8192]
-
blk.71.ffn_up.weightI16[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightI16[28672 8192]
-
blk.72.ffn_gate.weightI16[8192 28672]
-
blk.72.ffn_up.weightI16[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.weightI16[8192 1024]
-
blk.72.attn_output.weightI16[8192 8192]
-
blk.72.attn_q.weightI16[8192 8192]
-
blk.72.attn_v.weightQ4_K[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightI16[28672 8192]
-
blk.73.ffn_gate.weightI16[8192 28672]
-
blk.73.ffn_up.weightI16[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightI16[8192 1024]
-
blk.73.attn_output.weightI16[8192 8192]
-
blk.73.attn_q.weightI16[8192 8192]
-
blk.73.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_k.weightI16[8192 1024]
-
blk.74.attn_output.weightI16[8192 8192]
-
blk.74.attn_q.weightI16[8192 8192]
-
blk.74.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightI16[28672 8192]
-
blk.74.ffn_gate.weightI16[8192 28672]
-
blk.74.ffn_up.weightI16[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightI16[28672 8192]
-
blk.75.ffn_gate.weightI16[8192 28672]
-
blk.75.ffn_up.weightI16[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.attn_k.weightI16[8192 1024]
-
blk.75.attn_output.weightI16[8192 8192]
-
blk.75.attn_q.weightI16[8192 8192]
-
blk.75.attn_v.weightQ4_K[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightI16[28672 8192]
-
blk.76.ffn_gate.weightI16[8192 28672]
-
blk.76.ffn_up.weightI16[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightI16[8192 1024]
-
blk.76.attn_output.weightI16[8192 8192]
-
blk.76.attn_q.weightI16[8192 8192]
-
blk.76.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_k.weightI16[8192 1024]
-
blk.77.attn_q.weightI16[8192 8192]
-
blk.77.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightI16[28672 8192]
-
blk.77.ffn_gate.weightI16[8192 28672]
-
blk.77.ffn_up.weightI16[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_output.weightI16[8192 8192]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightI16[28672 8192]
-
blk.78.ffn_gate.weightI16[8192 28672]
-
blk.78.ffn_up.weightI16[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_k.weightI16[8192 1024]
-
blk.78.attn_output.weightI16[8192 8192]
-
blk.78.attn_q.weightI16[8192 8192]
-
blk.78.attn_v.weightQ4_K[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightI16[28672 8192]
-
blk.79.ffn_gate.weightI16[8192 28672]
-
blk.79.ffn_up.weightI16[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightI16[8192 1024]
-
blk.79.attn_output.weightI16[8192 8192]
-
blk.79.attn_q.weightI16[8192 8192]
-
blk.79.attn_v.weightQ4_K[8192 1024]
-
output_norm.weightF32[8192]
-
output.weightQ5_K[8192 128256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79