latest
19GB
Reflection Llama-3.1 70B is (currently) the world's top open-source LLM, trained with a new technique called Reflection-Tuning that teaches an LLM to detect mistakes in its reasoning and correct course.
70B
195 Pulls Updated 13 days ago
b7e3ee581a28 · 19GB
-
quantize.imatrix.chunks_count125
-
quantize.imatrix.datasetReflection-Llama-3.1-70B-IMat-GGUF/imatrix.dataset
-
quantize.imatrix.entries_count560
-
quantize.imatrix.fileReflection-Llama-3.1-70B-IMat-GGUF/imatrix.dat
-
general.architecturellama
-
general.file_typeIQ2_XXS
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length8192
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128262
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ Ġ ĠĠĠ ĠĠ ĠĠ ĠĠĠ Ġ i n ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id128009
-
tokenizer.ggml.prellama-bpe
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ2_K[8192 128262]
-
blk.0.ffn_gate.weightI8[8192 28672]
-
blk.0.attn_k.weightI8[8192 1024]
-
blk.0.attn_output.weightI8[8192 8192]
-
blk.0.attn_q.weightI8[8192 8192]
-
blk.0.attn_v.weightQ4_K[8192 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ2_K[28672 8192]
-
blk.0.ffn_up.weightI8[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.1.ffn_gate.weightI8[8192 28672]
-
blk.1.attn_k.weightI8[8192 1024]
-
blk.1.attn_output.weightI8[8192 8192]
-
blk.1.attn_q.weightI8[8192 8192]
-
blk.1.attn_v.weightQ4_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ2_K[28672 8192]
-
blk.1.ffn_up.weightI8[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.ffn_gate.weightI8[8192 28672]
-
blk.2.attn_k.weightI8[8192 1024]
-
blk.2.attn_output.weightI8[8192 8192]
-
blk.2.attn_q.weightI8[8192 8192]
-
blk.2.attn_v.weightQ4_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ2_K[28672 8192]
-
blk.2.ffn_up.weightI8[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.3.ffn_gate.weightI8[8192 28672]
-
blk.3.attn_k.weightI8[8192 1024]
-
blk.3.attn_output.weightI8[8192 8192]
-
blk.3.attn_q.weightI8[8192 8192]
-
blk.3.attn_v.weightQ4_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ2_K[28672 8192]
-
blk.3.ffn_up.weightI8[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.4.ffn_gate.weightI8[8192 28672]
-
blk.4.attn_k.weightI8[8192 1024]
-
blk.4.attn_output.weightI8[8192 8192]
-
blk.4.attn_q.weightI8[8192 8192]
-
blk.4.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ2_K[28672 8192]
-
blk.4.ffn_up.weightI8[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.5.ffn_gate.weightI8[8192 28672]
-
blk.5.attn_k.weightI8[8192 1024]
-
blk.5.attn_output.weightI8[8192 8192]
-
blk.5.attn_q.weightI8[8192 8192]
-
blk.5.attn_v.weightQ4_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ2_K[28672 8192]
-
blk.5.ffn_up.weightI8[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.6.ffn_gate.weightI8[8192 28672]
-
blk.6.attn_k.weightI8[8192 1024]
-
blk.6.attn_output.weightI8[8192 8192]
-
blk.6.attn_q.weightI8[8192 8192]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ2_K[28672 8192]
-
blk.6.ffn_up.weightI8[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.7.ffn_gate.weightI8[8192 28672]
-
blk.7.attn_k.weightI8[8192 1024]
-
blk.7.attn_output.weightI8[8192 8192]
-
blk.7.attn_q.weightI8[8192 8192]
-
blk.7.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ2_K[28672 8192]
-
blk.7.ffn_up.weightI8[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.8.ffn_gate.weightI8[8192 28672]
-
blk.8.attn_k.weightI8[8192 1024]
-
blk.8.attn_output.weightI8[8192 8192]
-
blk.8.attn_q.weightI8[8192 8192]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ2_K[28672 8192]
-
blk.8.ffn_up.weightI8[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.9.ffn_gate.weightI8[8192 28672]
-
blk.9.attn_k.weightI8[8192 1024]
-
blk.9.attn_output.weightI8[8192 8192]
-
blk.9.attn_q.weightI8[8192 8192]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ2_K[28672 8192]
-
blk.9.ffn_up.weightI8[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.10.ffn_gate.weightI8[8192 28672]
-
blk.10.attn_k.weightI8[8192 1024]
-
blk.10.attn_output.weightI8[8192 8192]
-
blk.10.attn_q.weightI8[8192 8192]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightI8[28672 8192]
-
blk.10.ffn_up.weightI8[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.11.ffn_gate.weightI8[8192 28672]
-
blk.11.attn_k.weightI8[8192 1024]
-
blk.11.attn_output.weightI8[8192 8192]
-
blk.11.attn_q.weightI8[8192 8192]
-
blk.11.attn_v.weightQ4_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightI8[28672 8192]
-
blk.11.ffn_up.weightI8[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.12.ffn_gate.weightI8[8192 28672]
-
blk.12.attn_k.weightI8[8192 1024]
-
blk.12.attn_output.weightI8[8192 8192]
-
blk.12.attn_q.weightI8[8192 8192]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightI8[28672 8192]
-
blk.12.ffn_up.weightI8[8192 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.ffn_gate.weightI8[8192 28672]
-
blk.13.attn_k.weightI8[8192 1024]
-
blk.13.attn_output.weightI8[8192 8192]
-
blk.13.attn_q.weightI8[8192 8192]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightI8[28672 8192]
-
blk.13.ffn_up.weightI8[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.14.ffn_gate.weightI8[8192 28672]
-
blk.14.attn_k.weightI8[8192 1024]
-
blk.14.attn_output.weightI8[8192 8192]
-
blk.14.attn_q.weightI8[8192 8192]
-
blk.14.attn_v.weightQ4_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightI8[28672 8192]
-
blk.14.ffn_up.weightI8[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.15.ffn_gate.weightI8[8192 28672]
-
blk.15.attn_k.weightI8[8192 1024]
-
blk.15.attn_output.weightI8[8192 8192]
-
blk.15.attn_q.weightI8[8192 8192]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightI8[28672 8192]
-
blk.15.ffn_up.weightI8[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.ffn_gate.weightI8[8192 28672]
-
blk.16.attn_k.weightI8[8192 1024]
-
blk.16.attn_output.weightI8[8192 8192]
-
blk.16.attn_q.weightI8[8192 8192]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightI8[28672 8192]
-
blk.16.ffn_up.weightI8[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.17.ffn_gate.weightI8[8192 28672]
-
blk.17.attn_k.weightI8[8192 1024]
-
blk.17.attn_output.weightI8[8192 8192]
-
blk.17.attn_q.weightI8[8192 8192]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightI8[28672 8192]
-
blk.17.ffn_up.weightI8[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.18.ffn_gate.weightI8[8192 28672]
-
blk.18.attn_k.weightI8[8192 1024]
-
blk.18.attn_output.weightI8[8192 8192]
-
blk.18.attn_q.weightI8[8192 8192]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightI8[28672 8192]
-
blk.18.ffn_up.weightI8[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.ffn_gate.weightI8[8192 28672]
-
blk.19.attn_k.weightI8[8192 1024]
-
blk.19.attn_output.weightI8[8192 8192]
-
blk.19.attn_q.weightI8[8192 8192]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightI8[28672 8192]
-
blk.19.ffn_up.weightI8[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.ffn_gate.weightI8[8192 28672]
-
blk.20.attn_k.weightI8[8192 1024]
-
blk.20.attn_output.weightI8[8192 8192]
-
blk.20.attn_q.weightI8[8192 8192]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightI8[28672 8192]
-
blk.20.ffn_up.weightI8[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.21.ffn_gate.weightI8[8192 28672]
-
blk.21.attn_k.weightI8[8192 1024]
-
blk.21.attn_output.weightI8[8192 8192]
-
blk.21.attn_q.weightI8[8192 8192]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightI8[28672 8192]
-
blk.21.ffn_up.weightI8[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.22.ffn_gate.weightI8[8192 28672]
-
blk.22.attn_k.weightI8[8192 1024]
-
blk.22.attn_output.weightI8[8192 8192]
-
blk.22.attn_q.weightI8[8192 8192]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightI8[28672 8192]
-
blk.22.ffn_up.weightI8[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.23.ffn_gate.weightI8[8192 28672]
-
blk.23.attn_k.weightI8[8192 1024]
-
blk.23.attn_output.weightI8[8192 8192]
-
blk.23.attn_q.weightI8[8192 8192]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightI8[28672 8192]
-
blk.23.ffn_up.weightI8[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.24.ffn_gate.weightI8[8192 28672]
-
blk.24.attn_k.weightI8[8192 1024]
-
blk.24.attn_output.weightI8[8192 8192]
-
blk.24.attn_q.weightI8[8192 8192]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightI8[28672 8192]
-
blk.24.ffn_up.weightI8[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.25.ffn_gate.weightI8[8192 28672]
-
blk.25.attn_k.weightI8[8192 1024]
-
blk.25.attn_output.weightI8[8192 8192]
-
blk.25.attn_q.weightI8[8192 8192]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightI8[28672 8192]
-
blk.25.ffn_up.weightI8[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.26.ffn_gate.weightI8[8192 28672]
-
blk.26.attn_k.weightI8[8192 1024]
-
blk.26.attn_output.weightI8[8192 8192]
-
blk.26.attn_q.weightI8[8192 8192]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightI8[28672 8192]
-
blk.26.ffn_up.weightI8[8192 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.ffn_gate.weightI8[8192 28672]
-
blk.27.attn_k.weightI8[8192 1024]
-
blk.27.attn_output.weightI8[8192 8192]
-
blk.27.attn_q.weightI8[8192 8192]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightI8[28672 8192]
-
blk.27.ffn_up.weightI8[8192 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.ffn_gate.weightI8[8192 28672]
-
blk.28.attn_k.weightI8[8192 1024]
-
blk.28.attn_output.weightI8[8192 8192]
-
blk.28.attn_q.weightI8[8192 8192]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightI8[28672 8192]
-
blk.28.ffn_up.weightI8[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.29.ffn_gate.weightI8[8192 28672]
-
blk.29.attn_k.weightI8[8192 1024]
-
blk.29.attn_output.weightI8[8192 8192]
-
blk.29.attn_q.weightI8[8192 8192]
-
blk.29.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightI8[28672 8192]
-
blk.29.ffn_up.weightI8[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.30.ffn_gate.weightI8[8192 28672]
-
blk.30.attn_k.weightI8[8192 1024]
-
blk.30.attn_output.weightI8[8192 8192]
-
blk.30.attn_q.weightI8[8192 8192]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightI8[28672 8192]
-
blk.30.ffn_up.weightI8[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.ffn_gate.weightI8[8192 28672]
-
blk.31.attn_k.weightI8[8192 1024]
-
blk.31.attn_output.weightI8[8192 8192]
-
blk.31.attn_q.weightI8[8192 8192]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightI8[28672 8192]
-
blk.31.ffn_up.weightI8[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.32.ffn_gate.weightI8[8192 28672]
-
blk.32.attn_k.weightI8[8192 1024]
-
blk.32.attn_output.weightI8[8192 8192]
-
blk.32.attn_q.weightI8[8192 8192]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightI8[28672 8192]
-
blk.32.ffn_up.weightI8[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.33.ffn_gate.weightI8[8192 28672]
-
blk.33.attn_k.weightI8[8192 1024]
-
blk.33.attn_output.weightI8[8192 8192]
-
blk.33.attn_q.weightI8[8192 8192]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightI8[28672 8192]
-
blk.33.ffn_up.weightI8[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.34.ffn_gate.weightI8[8192 28672]
-
blk.34.attn_k.weightI8[8192 1024]
-
blk.34.attn_output.weightI8[8192 8192]
-
blk.34.attn_q.weightI8[8192 8192]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightI8[28672 8192]
-
blk.34.ffn_up.weightI8[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.35.ffn_gate.weightI8[8192 28672]
-
blk.35.attn_k.weightI8[8192 1024]
-
blk.35.attn_output.weightI8[8192 8192]
-
blk.35.attn_q.weightI8[8192 8192]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightI8[28672 8192]
-
blk.35.ffn_up.weightI8[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.36.ffn_gate.weightI8[8192 28672]
-
blk.36.attn_k.weightI8[8192 1024]
-
blk.36.attn_output.weightI8[8192 8192]
-
blk.36.attn_q.weightI8[8192 8192]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightI8[28672 8192]
-
blk.36.ffn_up.weightI8[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.37.ffn_gate.weightI8[8192 28672]
-
blk.37.attn_k.weightI8[8192 1024]
-
blk.37.attn_output.weightI8[8192 8192]
-
blk.37.attn_q.weightI8[8192 8192]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightI8[28672 8192]
-
blk.37.ffn_up.weightI8[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.38.ffn_gate.weightI8[8192 28672]
-
blk.38.attn_k.weightI8[8192 1024]
-
blk.38.attn_output.weightI8[8192 8192]
-
blk.38.attn_q.weightI8[8192 8192]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightI8[28672 8192]
-
blk.38.ffn_up.weightI8[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.39.ffn_gate.weightI8[8192 28672]
-
blk.39.attn_k.weightI8[8192 1024]
-
blk.39.attn_output.weightI8[8192 8192]
-
blk.39.attn_q.weightI8[8192 8192]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightI8[28672 8192]
-
blk.39.ffn_up.weightI8[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.40.ffn_gate.weightI8[8192 28672]
-
blk.40.attn_k.weightI8[8192 1024]
-
blk.40.attn_output.weightI8[8192 8192]
-
blk.40.attn_q.weightI8[8192 8192]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightI8[28672 8192]
-
blk.40.ffn_up.weightI8[8192 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.41.ffn_gate.weightI8[8192 28672]
-
blk.41.attn_k.weightI8[8192 1024]
-
blk.41.attn_output.weightI8[8192 8192]
-
blk.41.attn_q.weightI8[8192 8192]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightI8[28672 8192]
-
blk.41.ffn_up.weightI8[8192 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.42.ffn_gate.weightI8[8192 28672]
-
blk.42.attn_k.weightI8[8192 1024]
-
blk.42.attn_output.weightI8[8192 8192]
-
blk.42.attn_q.weightI8[8192 8192]
-
blk.42.attn_v.weightQ4_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightI8[28672 8192]
-
blk.42.ffn_up.weightI8[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.43.ffn_gate.weightI8[8192 28672]
-
blk.43.attn_k.weightI8[8192 1024]
-
blk.43.attn_output.weightI8[8192 8192]
-
blk.43.attn_q.weightI8[8192 8192]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightI8[28672 8192]
-
blk.43.ffn_up.weightI8[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.ffn_gate.weightI8[8192 28672]
-
blk.44.attn_k.weightI8[8192 1024]
-
blk.44.attn_output.weightI8[8192 8192]
-
blk.44.attn_q.weightI8[8192 8192]
-
blk.44.attn_v.weightQ4_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightI8[28672 8192]
-
blk.44.ffn_up.weightI8[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.45.ffn_gate.weightI8[8192 28672]
-
blk.45.attn_k.weightI8[8192 1024]
-
blk.45.attn_output.weightI8[8192 8192]
-
blk.45.attn_q.weightI8[8192 8192]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightI8[28672 8192]
-
blk.45.ffn_up.weightI8[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.46.ffn_gate.weightI8[8192 28672]
-
blk.46.attn_k.weightI8[8192 1024]
-
blk.46.attn_output.weightI8[8192 8192]
-
blk.46.attn_q.weightI8[8192 8192]
-
blk.46.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightI8[28672 8192]
-
blk.46.ffn_up.weightI8[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.ffn_gate.weightI8[8192 28672]
-
blk.47.attn_k.weightI8[8192 1024]
-
blk.47.attn_output.weightI8[8192 8192]
-
blk.47.attn_q.weightI8[8192 8192]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightI8[28672 8192]
-
blk.47.ffn_up.weightI8[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.ffn_gate.weightI8[8192 28672]
-
blk.48.attn_k.weightI8[8192 1024]
-
blk.48.attn_output.weightI8[8192 8192]
-
blk.48.attn_q.weightI8[8192 8192]
-
blk.48.attn_v.weightQ4_K[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightI8[28672 8192]
-
blk.48.ffn_up.weightI8[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.49.ffn_gate.weightI8[8192 28672]
-
blk.49.attn_k.weightI8[8192 1024]
-
blk.49.attn_output.weightI8[8192 8192]
-
blk.49.attn_q.weightI8[8192 8192]
-
blk.49.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightI8[28672 8192]
-
blk.49.ffn_up.weightI8[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.50.ffn_gate.weightI8[8192 28672]
-
blk.50.attn_k.weightI8[8192 1024]
-
blk.50.attn_output.weightI8[8192 8192]
-
blk.50.attn_q.weightI8[8192 8192]
-
blk.50.attn_v.weightQ4_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightI8[28672 8192]
-
blk.50.ffn_up.weightI8[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.51.ffn_gate.weightI8[8192 28672]
-
blk.51.attn_k.weightI8[8192 1024]
-
blk.51.attn_output.weightI8[8192 8192]
-
blk.51.attn_q.weightI8[8192 8192]
-
blk.51.attn_v.weightQ4_K[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightI8[28672 8192]
-
blk.51.ffn_up.weightI8[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.52.ffn_gate.weightI8[8192 28672]
-
blk.52.attn_k.weightI8[8192 1024]
-
blk.52.attn_output.weightI8[8192 8192]
-
blk.52.attn_q.weightI8[8192 8192]
-
blk.52.attn_v.weightQ4_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightI8[28672 8192]
-
blk.52.ffn_up.weightI8[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.53.ffn_gate.weightI8[8192 28672]
-
blk.53.attn_k.weightI8[8192 1024]
-
blk.53.attn_output.weightI8[8192 8192]
-
blk.53.attn_q.weightI8[8192 8192]
-
blk.53.attn_v.weightQ4_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightI8[28672 8192]
-
blk.53.ffn_up.weightI8[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.54.ffn_gate.weightI8[8192 28672]
-
blk.54.attn_k.weightI8[8192 1024]
-
blk.54.attn_output.weightI8[8192 8192]
-
blk.54.attn_q.weightI8[8192 8192]
-
blk.54.attn_v.weightQ4_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightI8[28672 8192]
-
blk.54.ffn_up.weightI8[8192 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.ffn_gate.weightI8[8192 28672]
-
blk.55.attn_k.weightI8[8192 1024]
-
blk.55.attn_output.weightI8[8192 8192]
-
blk.55.attn_q.weightI8[8192 8192]
-
blk.55.attn_v.weightQ4_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightI8[28672 8192]
-
blk.55.ffn_up.weightI8[8192 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.56.ffn_gate.weightI8[8192 28672]
-
blk.56.attn_k.weightI8[8192 1024]
-
blk.56.attn_output.weightI8[8192 8192]
-
blk.56.attn_q.weightI8[8192 8192]
-
blk.56.attn_v.weightQ4_K[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightI8[28672 8192]
-
blk.56.ffn_up.weightI8[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.57.ffn_gate.weightI8[8192 28672]
-
blk.57.attn_k.weightI8[8192 1024]
-
blk.57.attn_output.weightI8[8192 8192]
-
blk.57.attn_q.weightI8[8192 8192]
-
blk.57.attn_v.weightQ4_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightI8[28672 8192]
-
blk.57.ffn_up.weightI8[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.58.ffn_gate.weightI8[8192 28672]
-
blk.58.attn_k.weightI8[8192 1024]
-
blk.58.attn_output.weightI8[8192 8192]
-
blk.58.attn_q.weightI8[8192 8192]
-
blk.58.attn_v.weightQ4_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightI8[28672 8192]
-
blk.58.ffn_up.weightI8[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.59.ffn_gate.weightI8[8192 28672]
-
blk.59.attn_k.weightI8[8192 1024]
-
blk.59.attn_output.weightI8[8192 8192]
-
blk.59.attn_q.weightI8[8192 8192]
-
blk.59.attn_v.weightQ4_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightI8[28672 8192]
-
blk.59.ffn_up.weightI8[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.60.ffn_gate.weightI8[8192 28672]
-
blk.60.attn_k.weightI8[8192 1024]
-
blk.60.attn_output.weightI8[8192 8192]
-
blk.60.attn_q.weightI8[8192 8192]
-
blk.60.attn_v.weightQ4_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightI8[28672 8192]
-
blk.60.ffn_up.weightI8[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.61.ffn_gate.weightI8[8192 28672]
-
blk.61.attn_k.weightI8[8192 1024]
-
blk.61.attn_output.weightI8[8192 8192]
-
blk.61.attn_q.weightI8[8192 8192]
-
blk.61.attn_v.weightQ4_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightI8[28672 8192]
-
blk.61.ffn_up.weightI8[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.62.ffn_gate.weightI8[8192 28672]
-
blk.62.attn_k.weightI8[8192 1024]
-
blk.62.attn_output.weightI8[8192 8192]
-
blk.62.attn_q.weightI8[8192 8192]
-
blk.62.attn_v.weightQ4_K[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightI8[28672 8192]
-
blk.62.ffn_up.weightI8[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.63.ffn_gate.weightI8[8192 28672]
-
blk.63.attn_k.weightI8[8192 1024]
-
blk.63.attn_output.weightI8[8192 8192]
-
blk.63.attn_q.weightI8[8192 8192]
-
blk.63.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightI8[28672 8192]
-
blk.63.ffn_up.weightI8[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.64.ffn_gate.weightI8[8192 28672]
-
blk.64.attn_k.weightI8[8192 1024]
-
blk.64.attn_output.weightI8[8192 8192]
-
blk.64.attn_q.weightI8[8192 8192]
-
blk.64.attn_v.weightQ4_K[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightI8[28672 8192]
-
blk.64.ffn_up.weightI8[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.65.ffn_gate.weightI8[8192 28672]
-
blk.65.attn_k.weightI8[8192 1024]
-
blk.65.attn_output.weightI8[8192 8192]
-
blk.65.attn_q.weightI8[8192 8192]
-
blk.65.attn_v.weightQ4_K[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightI8[28672 8192]
-
blk.65.ffn_up.weightI8[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.66.ffn_gate.weightI8[8192 28672]
-
blk.66.attn_k.weightI8[8192 1024]
-
blk.66.attn_output.weightI8[8192 8192]
-
blk.66.attn_q.weightI8[8192 8192]
-
blk.66.attn_v.weightQ4_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightI8[28672 8192]
-
blk.66.ffn_up.weightI8[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.67.ffn_gate.weightI8[8192 28672]
-
blk.67.attn_k.weightI8[8192 1024]
-
blk.67.attn_output.weightI8[8192 8192]
-
blk.67.attn_q.weightI8[8192 8192]
-
blk.67.attn_v.weightQ4_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightI8[28672 8192]
-
blk.67.ffn_up.weightI8[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.68.ffn_gate.weightI8[8192 28672]
-
blk.68.attn_k.weightI8[8192 1024]
-
blk.68.attn_output.weightI8[8192 8192]
-
blk.68.attn_q.weightI8[8192 8192]
-
blk.68.attn_v.weightQ4_K[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightI8[28672 8192]
-
blk.68.ffn_up.weightI8[8192 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.69.ffn_gate.weightI8[8192 28672]
-
blk.69.attn_k.weightI8[8192 1024]
-
blk.69.attn_output.weightI8[8192 8192]
-
blk.69.attn_q.weightI8[8192 8192]
-
blk.69.attn_v.weightQ4_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightI8[28672 8192]
-
blk.69.ffn_up.weightI8[8192 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.70.ffn_gate.weightI8[8192 28672]
-
blk.70.attn_k.weightI8[8192 1024]
-
blk.70.attn_output.weightI8[8192 8192]
-
blk.70.attn_q.weightI8[8192 8192]
-
blk.70.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightI8[28672 8192]
-
blk.70.ffn_up.weightI8[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.71.ffn_gate.weightI8[8192 28672]
-
blk.71.attn_k.weightI8[8192 1024]
-
blk.71.attn_output.weightI8[8192 8192]
-
blk.71.attn_q.weightI8[8192 8192]
-
blk.71.attn_v.weightQ4_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightI8[28672 8192]
-
blk.71.ffn_up.weightI8[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.ffn_gate.weightI8[8192 28672]
-
blk.72.attn_k.weightI8[8192 1024]
-
blk.72.attn_output.weightI8[8192 8192]
-
blk.72.attn_q.weightI8[8192 8192]
-
blk.72.attn_v.weightQ4_K[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightI8[28672 8192]
-
blk.72.ffn_up.weightI8[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.73.ffn_gate.weightI8[8192 28672]
-
blk.73.attn_k.weightI8[8192 1024]
-
blk.73.attn_output.weightI8[8192 8192]
-
blk.73.attn_q.weightI8[8192 8192]
-
blk.73.attn_v.weightQ4_K[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightI8[28672 8192]
-
blk.73.ffn_up.weightI8[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.74.ffn_gate.weightI8[8192 28672]
-
blk.74.attn_k.weightI8[8192 1024]
-
blk.74.attn_output.weightI8[8192 8192]
-
blk.74.attn_q.weightI8[8192 8192]
-
blk.74.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightI8[28672 8192]
-
blk.74.ffn_up.weightI8[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.ffn_gate.weightI8[8192 28672]
-
blk.75.attn_k.weightI8[8192 1024]
-
blk.75.attn_output.weightI8[8192 8192]
-
blk.75.attn_q.weightI8[8192 8192]
-
blk.75.attn_v.weightQ4_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightI8[28672 8192]
-
blk.75.ffn_up.weightI8[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.ffn_gate.weightI8[8192 28672]
-
blk.76.attn_k.weightI8[8192 1024]
-
blk.76.attn_output.weightI8[8192 8192]
-
blk.76.attn_q.weightI8[8192 8192]
-
blk.76.attn_v.weightQ4_K[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightI8[28672 8192]
-
blk.76.ffn_up.weightI8[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.77.ffn_gate.weightI8[8192 28672]
-
blk.77.attn_k.weightI8[8192 1024]
-
blk.77.attn_output.weightI8[8192 8192]
-
blk.77.attn_q.weightI8[8192 8192]
-
blk.77.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightI8[28672 8192]
-
blk.77.ffn_up.weightI8[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.78.ffn_gate.weightI8[8192 28672]
-
blk.78.attn_k.weightI8[8192 1024]
-
blk.78.attn_output.weightI8[8192 8192]
-
blk.78.attn_q.weightI8[8192 8192]
-
blk.78.attn_v.weightQ4_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightI8[28672 8192]
-
blk.78.ffn_up.weightI8[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.79.ffn_gate.weightI8[8192 28672]
-
blk.79.attn_k.weightI8[8192 1024]
-
blk.79.attn_output.weightI8[8192 8192]
-
blk.79.attn_q.weightI8[8192 8192]
-
blk.79.attn_v.weightQ4_K[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightI8[28672 8192]
-
blk.79.ffn_up.weightI8[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
output_norm.weightF32[8192]
-
output.weightQ5_K[8192 128262]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79