https://huggingface.co/mradermacher/Tess-70B-v1.6-GGUF
70B
38 Pulls Updated 6 months ago
ea94a4a00ab0 · 48GB
-
general.architecturellama
-
general.file_typeQ5_K_S
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length32764
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ5_K[8192 32001]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ5_K[28672 8192]
-
blk.0.ffn_gate.weightQ5_K[8192 28672]
-
blk.0.ffn_up.weightQ5_K[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ5_K[8192 1024]
-
blk.0.attn_output.weightQ5_K[8192 8192]
-
blk.0.attn_q.weightQ5_K[8192 8192]
-
blk.0.attn_v.weightQ5_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ5_K[28672 8192]
-
blk.1.ffn_gate.weightQ5_K[8192 28672]
-
blk.1.ffn_up.weightQ5_K[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ5_K[8192 1024]
-
blk.1.attn_output.weightQ5_K[8192 8192]
-
blk.1.attn_q.weightQ5_K[8192 8192]
-
blk.1.attn_v.weightQ5_K[8192 1024]
-
blk.2.ffn_gate.weightQ5_K[8192 28672]
-
blk.2.attn_k.weightQ5_K[8192 1024]
-
blk.2.attn_output.weightQ5_K[8192 8192]
-
blk.2.attn_q.weightQ5_K[8192 8192]
-
blk.2.attn_v.weightQ5_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ5_K[28672 8192]
-
blk.2.ffn_up.weightQ5_K[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ5_K[28672 8192]
-
blk.3.ffn_gate.weightQ5_K[8192 28672]
-
blk.3.ffn_up.weightQ5_K[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ5_K[8192 1024]
-
blk.3.attn_output.weightQ5_K[8192 8192]
-
blk.3.attn_q.weightQ5_K[8192 8192]
-
blk.3.attn_v.weightQ5_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ5_K[28672 8192]
-
blk.4.ffn_gate.weightQ5_K[8192 28672]
-
blk.4.ffn_up.weightQ5_K[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ5_K[8192 1024]
-
blk.4.attn_output.weightQ5_K[8192 8192]
-
blk.4.attn_q.weightQ5_K[8192 8192]
-
blk.4.attn_v.weightQ5_K[8192 1024]
-
blk.5.attn_k.weightQ5_K[8192 1024]
-
blk.5.attn_output.weightQ5_K[8192 8192]
-
blk.5.attn_q.weightQ5_K[8192 8192]
-
blk.5.attn_v.weightQ5_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ5_K[28672 8192]
-
blk.5.ffn_gate.weightQ5_K[8192 28672]
-
blk.5.ffn_up.weightQ5_K[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ5_K[28672 8192]
-
blk.6.ffn_gate.weightQ5_K[8192 28672]
-
blk.6.ffn_up.weightQ5_K[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightQ5_K[8192 1024]
-
blk.6.attn_output.weightQ5_K[8192 8192]
-
blk.6.attn_q.weightQ5_K[8192 8192]
-
blk.6.attn_v.weightQ5_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ5_K[28672 8192]
-
blk.7.ffn_gate.weightQ5_K[8192 28672]
-
blk.7.ffn_up.weightQ5_K[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ5_K[8192 1024]
-
blk.7.attn_output.weightQ5_K[8192 8192]
-
blk.7.attn_q.weightQ5_K[8192 8192]
-
blk.7.attn_v.weightQ5_K[8192 1024]
-
blk.8.attn_k.weightQ5_K[8192 1024]
-
blk.8.attn_q.weightQ5_K[8192 8192]
-
blk.8.attn_v.weightQ5_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ5_K[28672 8192]
-
blk.8.ffn_gate.weightQ5_K[8192 28672]
-
blk.8.ffn_up.weightQ5_K[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_output.weightQ5_K[8192 8192]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ5_K[28672 8192]
-
blk.9.ffn_gate.weightQ5_K[8192 28672]
-
blk.9.ffn_up.weightQ5_K[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ5_K[8192 1024]
-
blk.9.attn_output.weightQ5_K[8192 8192]
-
blk.9.attn_q.weightQ5_K[8192 8192]
-
blk.9.attn_v.weightQ5_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ5_K[28672 8192]
-
blk.10.ffn_gate.weightQ5_K[8192 28672]
-
blk.10.ffn_up.weightQ5_K[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ5_K[8192 1024]
-
blk.10.attn_output.weightQ5_K[8192 8192]
-
blk.10.attn_q.weightQ5_K[8192 8192]
-
blk.10.attn_v.weightQ5_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ5_K[28672 8192]
-
blk.11.ffn_gate.weightQ5_K[8192 28672]
-
blk.11.ffn_up.weightQ5_K[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ5_K[8192 1024]
-
blk.11.attn_output.weightQ5_K[8192 8192]
-
blk.11.attn_q.weightQ5_K[8192 8192]
-
blk.11.attn_v.weightQ5_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ5_K[28672 8192]
-
blk.12.ffn_gate.weightQ5_K[8192 28672]
-
blk.12.ffn_up.weightQ5_K[8192 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.weightQ5_K[8192 1024]
-
blk.12.attn_output.weightQ5_K[8192 8192]
-
blk.12.attn_q.weightQ5_K[8192 8192]
-
blk.12.attn_v.weightQ5_K[8192 1024]
-
blk.13.ffn_gate.weightQ5_K[8192 28672]
-
blk.13.ffn_up.weightQ5_K[8192 28672]
-
blk.13.attn_k.weightQ5_K[8192 1024]
-
blk.13.attn_output.weightQ5_K[8192 8192]
-
blk.13.attn_q.weightQ5_K[8192 8192]
-
blk.13.attn_v.weightQ5_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ5_K[28672 8192]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ5_K[28672 8192]
-
blk.14.ffn_gate.weightQ5_K[8192 28672]
-
blk.14.ffn_up.weightQ5_K[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ5_K[8192 1024]
-
blk.14.attn_output.weightQ5_K[8192 8192]
-
blk.14.attn_q.weightQ5_K[8192 8192]
-
blk.14.attn_v.weightQ5_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ5_K[28672 8192]
-
blk.15.ffn_gate.weightQ5_K[8192 28672]
-
blk.15.ffn_up.weightQ5_K[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ5_K[8192 1024]
-
blk.15.attn_output.weightQ5_K[8192 8192]
-
blk.15.attn_q.weightQ5_K[8192 8192]
-
blk.15.attn_v.weightQ5_K[8192 1024]
-
blk.16.ffn_gate.weightQ5_K[8192 28672]
-
blk.16.attn_k.weightQ5_K[8192 1024]
-
blk.16.attn_output.weightQ5_K[8192 8192]
-
blk.16.attn_q.weightQ5_K[8192 8192]
-
blk.16.attn_v.weightQ5_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ5_K[28672 8192]
-
blk.16.ffn_up.weightQ5_K[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ5_K[28672 8192]
-
blk.17.ffn_gate.weightQ5_K[8192 28672]
-
blk.17.ffn_up.weightQ5_K[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ5_K[8192 1024]
-
blk.17.attn_output.weightQ5_K[8192 8192]
-
blk.17.attn_q.weightQ5_K[8192 8192]
-
blk.17.attn_v.weightQ5_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ5_K[28672 8192]
-
blk.18.ffn_gate.weightQ5_K[8192 28672]
-
blk.18.ffn_up.weightQ5_K[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.weightQ5_K[8192 1024]
-
blk.18.attn_output.weightQ5_K[8192 8192]
-
blk.18.attn_q.weightQ5_K[8192 8192]
-
blk.18.attn_v.weightQ5_K[8192 1024]
-
blk.19.attn_k.weightQ5_K[8192 1024]
-
blk.19.attn_output.weightQ5_K[8192 8192]
-
blk.19.attn_q.weightQ5_K[8192 8192]
-
blk.19.attn_v.weightQ5_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ5_K[28672 8192]
-
blk.19.ffn_gate.weightQ5_K[8192 28672]
-
blk.19.ffn_up.weightQ5_K[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ5_K[28672 8192]
-
blk.20.ffn_gate.weightQ5_K[8192 28672]
-
blk.20.ffn_up.weightQ5_K[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ5_K[8192 1024]
-
blk.20.attn_output.weightQ5_K[8192 8192]
-
blk.20.attn_q.weightQ5_K[8192 8192]
-
blk.20.attn_v.weightQ5_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ5_K[28672 8192]
-
blk.21.ffn_gate.weightQ5_K[8192 28672]
-
blk.21.ffn_up.weightQ5_K[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.weightQ5_K[8192 1024]
-
blk.21.attn_output.weightQ5_K[8192 8192]
-
blk.21.attn_q.weightQ5_K[8192 8192]
-
blk.21.attn_v.weightQ5_K[8192 1024]
-
blk.22.attn_k.weightQ5_K[8192 1024]
-
blk.22.attn_q.weightQ5_K[8192 8192]
-
blk.22.attn_v.weightQ5_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ5_K[28672 8192]
-
blk.22.ffn_gate.weightQ5_K[8192 28672]
-
blk.22.ffn_up.weightQ5_K[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_output.weightQ5_K[8192 8192]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ5_K[28672 8192]
-
blk.23.ffn_gate.weightQ5_K[8192 28672]
-
blk.23.ffn_up.weightQ5_K[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ5_K[8192 1024]
-
blk.23.attn_output.weightQ5_K[8192 8192]
-
blk.23.attn_q.weightQ5_K[8192 8192]
-
blk.23.attn_v.weightQ5_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ5_K[28672 8192]
-
blk.24.ffn_gate.weightQ5_K[8192 28672]
-
blk.24.ffn_up.weightQ5_K[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ5_K[8192 1024]
-
blk.24.attn_output.weightQ5_K[8192 8192]
-
blk.24.attn_q.weightQ5_K[8192 8192]
-
blk.24.attn_v.weightQ5_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ5_K[28672 8192]
-
blk.25.ffn_gate.weightQ5_K[8192 28672]
-
blk.25.ffn_up.weightQ5_K[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ5_K[8192 1024]
-
blk.25.attn_output.weightQ5_K[8192 8192]
-
blk.25.attn_q.weightQ5_K[8192 8192]
-
blk.25.attn_v.weightQ5_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ5_K[28672 8192]
-
blk.26.ffn_gate.weightQ5_K[8192 28672]
-
blk.26.ffn_up.weightQ5_K[8192 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ5_K[8192 1024]
-
blk.26.attn_output.weightQ5_K[8192 8192]
-
blk.26.attn_q.weightQ5_K[8192 8192]
-
blk.26.attn_v.weightQ5_K[8192 1024]
-
blk.27.ffn_gate.weightQ5_K[8192 28672]
-
blk.27.ffn_up.weightQ5_K[8192 28672]
-
blk.27.attn_k.weightQ5_K[8192 1024]
-
blk.27.attn_output.weightQ5_K[8192 8192]
-
blk.27.attn_q.weightQ5_K[8192 8192]
-
blk.27.attn_v.weightQ5_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ5_K[28672 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ5_K[28672 8192]
-
blk.28.ffn_gate.weightQ5_K[8192 28672]
-
blk.28.ffn_up.weightQ5_K[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ5_K[8192 1024]
-
blk.28.attn_output.weightQ5_K[8192 8192]
-
blk.28.attn_q.weightQ5_K[8192 8192]
-
blk.28.attn_v.weightQ5_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ5_K[28672 8192]
-
blk.29.ffn_gate.weightQ5_K[8192 28672]
-
blk.29.ffn_up.weightQ5_K[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ5_K[8192 1024]
-
blk.29.attn_output.weightQ5_K[8192 8192]
-
blk.29.attn_q.weightQ5_K[8192 8192]
-
blk.29.attn_v.weightQ5_K[8192 1024]
-
blk.30.ffn_gate.weightQ5_K[8192 28672]
-
blk.30.attn_k.weightQ5_K[8192 1024]
-
blk.30.attn_output.weightQ5_K[8192 8192]
-
blk.30.attn_q.weightQ5_K[8192 8192]
-
blk.30.attn_v.weightQ5_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ5_K[28672 8192]
-
blk.30.ffn_up.weightQ5_K[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ5_K[28672 8192]
-
blk.31.ffn_gate.weightQ5_K[8192 28672]
-
blk.31.ffn_up.weightQ5_K[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ5_K[8192 1024]
-
blk.31.attn_output.weightQ5_K[8192 8192]
-
blk.31.attn_q.weightQ5_K[8192 8192]
-
blk.31.attn_v.weightQ5_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ5_K[28672 8192]
-
blk.32.ffn_gate.weightQ5_K[8192 28672]
-
blk.32.ffn_up.weightQ5_K[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ5_K[8192 1024]
-
blk.32.attn_output.weightQ5_K[8192 8192]
-
blk.32.attn_q.weightQ5_K[8192 8192]
-
blk.32.attn_v.weightQ5_K[8192 1024]
-
blk.33.attn_k.weightQ5_K[8192 1024]
-
blk.33.attn_output.weightQ5_K[8192 8192]
-
blk.33.attn_q.weightQ5_K[8192 8192]
-
blk.33.attn_v.weightQ5_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ5_K[28672 8192]
-
blk.33.ffn_gate.weightQ5_K[8192 28672]
-
blk.33.ffn_up.weightQ5_K[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ5_K[28672 8192]
-
blk.34.ffn_gate.weightQ5_K[8192 28672]
-
blk.34.ffn_up.weightQ5_K[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ5_K[8192 1024]
-
blk.34.attn_output.weightQ5_K[8192 8192]
-
blk.34.attn_q.weightQ5_K[8192 8192]
-
blk.34.attn_v.weightQ5_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ5_K[28672 8192]
-
blk.35.ffn_gate.weightQ5_K[8192 28672]
-
blk.35.ffn_up.weightQ5_K[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ5_K[8192 1024]
-
blk.35.attn_output.weightQ5_K[8192 8192]
-
blk.35.attn_q.weightQ5_K[8192 8192]
-
blk.35.attn_v.weightQ5_K[8192 1024]
-
blk.36.attn_k.weightQ5_K[8192 1024]
-
blk.36.attn_q.weightQ5_K[8192 8192]
-
blk.36.attn_v.weightQ5_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ5_K[28672 8192]
-
blk.36.ffn_gate.weightQ5_K[8192 28672]
-
blk.36.ffn_up.weightQ5_K[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_output.weightQ5_K[8192 8192]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ5_K[28672 8192]
-
blk.37.ffn_gate.weightQ5_K[8192 28672]
-
blk.37.ffn_up.weightQ5_K[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ5_K[8192 1024]
-
blk.37.attn_output.weightQ5_K[8192 8192]
-
blk.37.attn_q.weightQ5_K[8192 8192]
-
blk.37.attn_v.weightQ5_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ5_K[28672 8192]
-
blk.38.ffn_gate.weightQ5_K[8192 28672]
-
blk.38.ffn_up.weightQ5_K[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ5_K[8192 1024]
-
blk.38.attn_output.weightQ5_K[8192 8192]
-
blk.38.attn_q.weightQ5_K[8192 8192]
-
blk.38.attn_v.weightQ5_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ5_K[28672 8192]
-
blk.39.ffn_gate.weightQ5_K[8192 28672]
-
blk.39.ffn_up.weightQ5_K[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ5_K[8192 1024]
-
blk.39.attn_output.weightQ5_K[8192 8192]
-
blk.39.attn_q.weightQ5_K[8192 8192]
-
blk.39.attn_v.weightQ5_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ5_K[28672 8192]
-
blk.40.ffn_gate.weightQ5_K[8192 28672]
-
blk.40.ffn_up.weightQ5_K[8192 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ5_K[8192 1024]
-
blk.40.attn_output.weightQ5_K[8192 8192]
-
blk.40.attn_q.weightQ5_K[8192 8192]
-
blk.40.attn_v.weightQ5_K[8192 1024]
-
blk.41.ffn_gate.weightQ5_K[8192 28672]
-
blk.41.ffn_up.weightQ5_K[8192 28672]
-
blk.41.attn_k.weightQ5_K[8192 1024]
-
blk.41.attn_output.weightQ5_K[8192 8192]
-
blk.41.attn_q.weightQ5_K[8192 8192]
-
blk.41.attn_v.weightQ5_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ5_K[28672 8192]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ5_K[28672 8192]
-
blk.42.ffn_gate.weightQ5_K[8192 28672]
-
blk.42.ffn_up.weightQ5_K[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ5_K[8192 1024]
-
blk.42.attn_output.weightQ5_K[8192 8192]
-
blk.42.attn_q.weightQ5_K[8192 8192]
-
blk.42.attn_v.weightQ5_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ5_K[28672 8192]
-
blk.43.ffn_gate.weightQ5_K[8192 28672]
-
blk.43.ffn_up.weightQ5_K[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ5_K[8192 1024]
-
blk.43.attn_output.weightQ5_K[8192 8192]
-
blk.43.attn_q.weightQ5_K[8192 8192]
-
blk.43.attn_v.weightQ5_K[8192 1024]
-
blk.44.ffn_gate.weightQ5_K[8192 28672]
-
blk.44.attn_k.weightQ5_K[8192 1024]
-
blk.44.attn_output.weightQ5_K[8192 8192]
-
blk.44.attn_q.weightQ5_K[8192 8192]
-
blk.44.attn_v.weightQ5_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ5_K[28672 8192]
-
blk.44.ffn_up.weightQ5_K[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ5_K[28672 8192]
-
blk.45.ffn_gate.weightQ5_K[8192 28672]
-
blk.45.ffn_up.weightQ5_K[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ5_K[8192 1024]
-
blk.45.attn_output.weightQ5_K[8192 8192]
-
blk.45.attn_q.weightQ5_K[8192 8192]
-
blk.45.attn_v.weightQ5_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ5_K[28672 8192]
-
blk.46.ffn_gate.weightQ5_K[8192 28672]
-
blk.46.ffn_up.weightQ5_K[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ5_K[8192 1024]
-
blk.46.attn_output.weightQ5_K[8192 8192]
-
blk.46.attn_q.weightQ5_K[8192 8192]
-
blk.46.attn_v.weightQ5_K[8192 1024]
-
blk.47.attn_k.weightQ5_K[8192 1024]
-
blk.47.attn_output.weightQ5_K[8192 8192]
-
blk.47.attn_q.weightQ5_K[8192 8192]
-
blk.47.attn_v.weightQ5_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ5_K[28672 8192]
-
blk.47.ffn_gate.weightQ5_K[8192 28672]
-
blk.47.ffn_up.weightQ5_K[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ5_K[28672 8192]
-
blk.48.ffn_gate.weightQ5_K[8192 28672]
-
blk.48.ffn_up.weightQ5_K[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightQ5_K[8192 1024]
-
blk.48.attn_output.weightQ5_K[8192 8192]
-
blk.48.attn_q.weightQ5_K[8192 8192]
-
blk.48.attn_v.weightQ5_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ5_K[28672 8192]
-
blk.49.ffn_gate.weightQ5_K[8192 28672]
-
blk.49.ffn_up.weightQ5_K[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.weightQ5_K[8192 1024]
-
blk.49.attn_output.weightQ5_K[8192 8192]
-
blk.49.attn_q.weightQ5_K[8192 8192]
-
blk.49.attn_v.weightQ5_K[8192 1024]
-
blk.50.attn_k.weightQ5_K[8192 1024]
-
blk.50.attn_q.weightQ5_K[8192 8192]
-
blk.50.attn_v.weightQ5_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightQ5_K[28672 8192]
-
blk.50.ffn_gate.weightQ5_K[8192 28672]
-
blk.50.ffn_up.weightQ5_K[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_output.weightQ5_K[8192 8192]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ5_K[28672 8192]
-
blk.51.ffn_gate.weightQ5_K[8192 28672]
-
blk.51.ffn_up.weightQ5_K[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightQ5_K[8192 1024]
-
blk.51.attn_output.weightQ5_K[8192 8192]
-
blk.51.attn_q.weightQ5_K[8192 8192]
-
blk.51.attn_v.weightQ5_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ5_K[28672 8192]
-
blk.52.ffn_gate.weightQ5_K[8192 28672]
-
blk.52.ffn_up.weightQ5_K[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightQ5_K[8192 1024]
-
blk.52.attn_output.weightQ5_K[8192 8192]
-
blk.52.attn_q.weightQ5_K[8192 8192]
-
blk.52.attn_v.weightQ5_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightQ5_K[28672 8192]
-
blk.53.ffn_gate.weightQ5_K[8192 28672]
-
blk.53.ffn_up.weightQ5_K[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightQ5_K[8192 1024]
-
blk.53.attn_output.weightQ5_K[8192 8192]
-
blk.53.attn_q.weightQ5_K[8192 8192]
-
blk.53.attn_v.weightQ5_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ5_K[28672 8192]
-
blk.54.ffn_gate.weightQ5_K[8192 28672]
-
blk.54.ffn_up.weightQ5_K[8192 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.weightQ5_K[8192 1024]
-
blk.54.attn_output.weightQ5_K[8192 8192]
-
blk.54.attn_q.weightQ5_K[8192 8192]
-
blk.54.attn_v.weightQ5_K[8192 1024]
-
blk.55.ffn_gate.weightQ5_K[8192 28672]
-
blk.55.ffn_up.weightQ5_K[8192 28672]
-
blk.55.attn_k.weightQ5_K[8192 1024]
-
blk.55.attn_output.weightQ5_K[8192 8192]
-
blk.55.attn_q.weightQ5_K[8192 8192]
-
blk.55.attn_v.weightQ5_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ5_K[28672 8192]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightQ5_K[28672 8192]
-
blk.56.ffn_gate.weightQ5_K[8192 28672]
-
blk.56.ffn_up.weightQ5_K[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightQ5_K[8192 1024]
-
blk.56.attn_output.weightQ5_K[8192 8192]
-
blk.56.attn_q.weightQ5_K[8192 8192]
-
blk.56.attn_v.weightQ5_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightQ5_K[28672 8192]
-
blk.57.ffn_gate.weightQ5_K[8192 28672]
-
blk.57.ffn_up.weightQ5_K[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.weightQ5_K[8192 1024]
-
blk.57.attn_output.weightQ5_K[8192 8192]
-
blk.57.attn_q.weightQ5_K[8192 8192]
-
blk.57.attn_v.weightQ5_K[8192 1024]
-
blk.58.ffn_gate.weightQ5_K[8192 28672]
-
blk.58.attn_k.weightQ5_K[8192 1024]
-
blk.58.attn_output.weightQ5_K[8192 8192]
-
blk.58.attn_q.weightQ5_K[8192 8192]
-
blk.58.attn_v.weightQ5_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ5_K[28672 8192]
-
blk.58.ffn_up.weightQ5_K[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightQ5_K[28672 8192]
-
blk.59.ffn_gate.weightQ5_K[8192 28672]
-
blk.59.ffn_up.weightQ5_K[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightQ5_K[8192 1024]
-
blk.59.attn_output.weightQ5_K[8192 8192]
-
blk.59.attn_q.weightQ5_K[8192 8192]
-
blk.59.attn_v.weightQ5_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ5_K[28672 8192]
-
blk.60.ffn_gate.weightQ5_K[8192 28672]
-
blk.60.ffn_up.weightQ5_K[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.weightQ5_K[8192 1024]
-
blk.60.attn_output.weightQ5_K[8192 8192]
-
blk.60.attn_q.weightQ5_K[8192 8192]
-
blk.60.attn_v.weightQ5_K[8192 1024]
-
blk.61.attn_k.weightQ5_K[8192 1024]
-
blk.61.attn_output.weightQ5_K[8192 8192]
-
blk.61.attn_q.weightQ5_K[8192 8192]
-
blk.61.attn_v.weightQ5_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ5_K[28672 8192]
-
blk.61.ffn_gate.weightQ5_K[8192 28672]
-
blk.61.ffn_up.weightQ5_K[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ5_K[28672 8192]
-
blk.62.ffn_gate.weightQ5_K[8192 28672]
-
blk.62.ffn_up.weightQ5_K[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightQ5_K[8192 1024]
-
blk.62.attn_output.weightQ5_K[8192 8192]
-
blk.62.attn_q.weightQ5_K[8192 8192]
-
blk.62.attn_v.weightQ5_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ5_K[28672 8192]
-
blk.63.ffn_gate.weightQ5_K[8192 28672]
-
blk.63.ffn_up.weightQ5_K[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.weightQ5_K[8192 1024]
-
blk.63.attn_output.weightQ5_K[8192 8192]
-
blk.63.attn_q.weightQ5_K[8192 8192]
-
blk.63.attn_v.weightQ5_K[8192 1024]
-
blk.64.attn_k.weightQ5_K[8192 1024]
-
blk.64.attn_q.weightQ5_K[8192 8192]
-
blk.64.attn_v.weightQ5_K[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ5_K[28672 8192]
-
blk.64.ffn_gate.weightQ5_K[8192 28672]
-
blk.64.ffn_up.weightQ5_K[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_output.weightQ5_K[8192 8192]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ5_K[28672 8192]
-
blk.65.ffn_gate.weightQ5_K[8192 28672]
-
blk.65.ffn_up.weightQ5_K[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightQ5_K[8192 1024]
-
blk.65.attn_output.weightQ5_K[8192 8192]
-
blk.65.attn_q.weightQ5_K[8192 8192]
-
blk.65.attn_v.weightQ5_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ5_K[28672 8192]
-
blk.66.ffn_gate.weightQ5_K[8192 28672]
-
blk.66.ffn_up.weightQ5_K[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightQ5_K[8192 1024]
-
blk.66.attn_output.weightQ5_K[8192 8192]
-
blk.66.attn_q.weightQ5_K[8192 8192]
-
blk.66.attn_v.weightQ5_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ5_K[28672 8192]
-
blk.67.ffn_gate.weightQ5_K[8192 28672]
-
blk.67.ffn_up.weightQ5_K[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightQ5_K[8192 1024]
-
blk.67.attn_output.weightQ5_K[8192 8192]
-
blk.67.attn_q.weightQ5_K[8192 8192]
-
blk.67.attn_v.weightQ5_K[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightQ5_K[28672 8192]
-
blk.68.ffn_gate.weightQ5_K[8192 28672]
-
blk.68.ffn_up.weightQ5_K[8192 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.weightQ5_K[8192 1024]
-
blk.68.attn_output.weightQ5_K[8192 8192]
-
blk.68.attn_q.weightQ5_K[8192 8192]
-
blk.68.attn_v.weightQ5_K[8192 1024]
-
blk.69.ffn_gate.weightQ5_K[8192 28672]
-
blk.69.ffn_up.weightQ5_K[8192 28672]
-
blk.69.attn_k.weightQ5_K[8192 1024]
-
blk.69.attn_output.weightQ5_K[8192 8192]
-
blk.69.attn_q.weightQ5_K[8192 8192]
-
blk.69.attn_v.weightQ5_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ5_K[28672 8192]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ5_K[28672 8192]
-
blk.70.ffn_gate.weightQ5_K[8192 28672]
-
blk.70.ffn_up.weightQ5_K[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightQ5_K[8192 1024]
-
blk.70.attn_output.weightQ5_K[8192 8192]
-
blk.70.attn_q.weightQ5_K[8192 8192]
-
blk.70.attn_v.weightQ5_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ5_K[28672 8192]
-
blk.71.ffn_gate.weightQ5_K[8192 28672]
-
blk.71.ffn_up.weightQ5_K[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.weightQ5_K[8192 1024]
-
blk.71.attn_output.weightQ5_K[8192 8192]
-
blk.71.attn_q.weightQ5_K[8192 8192]
-
blk.71.attn_v.weightQ5_K[8192 1024]
-
blk.72.ffn_gate.weightQ5_K[8192 28672]
-
blk.72.attn_k.weightQ5_K[8192 1024]
-
blk.72.attn_output.weightQ5_K[8192 8192]
-
blk.72.attn_q.weightQ5_K[8192 8192]
-
blk.72.attn_v.weightQ5_K[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ5_K[28672 8192]
-
blk.72.ffn_up.weightQ5_K[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ5_K[28672 8192]
-
blk.73.ffn_gate.weightQ5_K[8192 28672]
-
blk.73.ffn_up.weightQ5_K[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightQ5_K[8192 1024]
-
blk.73.attn_output.weightQ5_K[8192 8192]
-
blk.73.attn_q.weightQ5_K[8192 8192]
-
blk.73.attn_v.weightQ5_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ5_K[28672 8192]
-
blk.74.ffn_gate.weightQ5_K[8192 28672]
-
blk.74.ffn_up.weightQ5_K[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.weightQ5_K[8192 1024]
-
blk.74.attn_output.weightQ5_K[8192 8192]
-
blk.74.attn_q.weightQ5_K[8192 8192]
-
blk.74.attn_v.weightQ5_K[8192 1024]
-
blk.75.attn_k.weightQ5_K[8192 1024]
-
blk.75.attn_output.weightQ5_K[8192 8192]
-
blk.75.attn_q.weightQ5_K[8192 8192]
-
blk.75.attn_v.weightQ5_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ5_K[28672 8192]
-
blk.75.ffn_gate.weightQ5_K[8192 28672]
-
blk.75.ffn_up.weightQ5_K[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ5_K[28672 8192]
-
blk.76.ffn_gate.weightQ5_K[8192 28672]
-
blk.76.ffn_up.weightQ5_K[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightQ5_K[8192 1024]
-
blk.76.attn_output.weightQ5_K[8192 8192]
-
blk.76.attn_q.weightQ5_K[8192 8192]
-
blk.76.attn_v.weightQ5_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ5_K[28672 8192]
-
blk.77.ffn_gate.weightQ5_K[8192 28672]
-
blk.77.ffn_up.weightQ5_K[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.weightQ5_K[8192 1024]
-
blk.77.attn_output.weightQ5_K[8192 8192]
-
blk.77.attn_q.weightQ5_K[8192 8192]
-
blk.77.attn_v.weightQ5_K[8192 1024]
-
blk.78.attn_k.weightQ5_K[8192 1024]
-
blk.78.attn_q.weightQ5_K[8192 8192]
-
blk.78.attn_v.weightQ5_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightQ5_K[28672 8192]
-
blk.78.ffn_gate.weightQ5_K[8192 28672]
-
blk.78.ffn_up.weightQ5_K[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_output.weightQ5_K[8192 8192]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ5_K[28672 8192]
-
blk.79.ffn_gate.weightQ5_K[8192 28672]
-
blk.79.ffn_up.weightQ5_K[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightQ5_K[8192 1024]
-
blk.79.attn_output.weightQ5_K[8192 8192]
-
blk.79.attn_q.weightQ5_K[8192 8192]
-
blk.79.attn_v.weightQ5_K[8192 1024]
-
output.weightF16[8192 32001]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79