latest
62GB
54 Pulls Updated 7 months ago
cad221120528 · 62GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count120
-
llama.context_length32768
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[8192 32000]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ6_K[28672 8192]
-
blk.0.ffn_gate.weightQ4_K[8192 28672]
-
blk.0.ffn_up.weightQ4_K[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_K[8192 1024]
-
blk.0.attn_output.weightQ4_K[8192 8192]
-
blk.0.attn_q.weightQ4_K[8192 8192]
-
blk.0.attn_v.weightQ6_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ6_K[28672 8192]
-
blk.1.ffn_gate.weightQ4_K[8192 28672]
-
blk.1.ffn_up.weightQ4_K[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ4_K[8192 1024]
-
blk.1.attn_output.weightQ4_K[8192 8192]
-
blk.1.attn_q.weightQ4_K[8192 8192]
-
blk.1.attn_v.weightQ6_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ6_K[28672 8192]
-
blk.2.ffn_gate.weightQ4_K[8192 28672]
-
blk.2.ffn_up.weightQ4_K[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ4_K[8192 1024]
-
blk.2.attn_output.weightQ4_K[8192 8192]
-
blk.2.attn_q.weightQ4_K[8192 8192]
-
blk.2.attn_v.weightQ6_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ6_K[28672 8192]
-
blk.3.ffn_gate.weightQ4_K[8192 28672]
-
blk.3.ffn_up.weightQ4_K[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ4_K[8192 1024]
-
blk.3.attn_output.weightQ4_K[8192 8192]
-
blk.3.attn_q.weightQ4_K[8192 8192]
-
blk.3.attn_v.weightQ6_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ6_K[28672 8192]
-
blk.4.ffn_gate.weightQ4_K[8192 28672]
-
blk.4.ffn_up.weightQ4_K[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ4_K[8192 1024]
-
blk.4.attn_output.weightQ4_K[8192 8192]
-
blk.4.attn_q.weightQ4_K[8192 8192]
-
blk.4.attn_v.weightQ6_K[8192 1024]
-
blk.5.attn_k.weightQ4_K[8192 1024]
-
blk.5.attn_output.weightQ4_K[8192 8192]
-
blk.5.attn_q.weightQ4_K[8192 8192]
-
blk.5.attn_v.weightQ6_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ6_K[28672 8192]
-
blk.5.ffn_gate.weightQ4_K[8192 28672]
-
blk.5.ffn_up.weightQ4_K[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ6_K[28672 8192]
-
blk.6.ffn_gate.weightQ4_K[8192 28672]
-
blk.6.ffn_up.weightQ4_K[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightQ4_K[8192 1024]
-
blk.6.attn_output.weightQ4_K[8192 8192]
-
blk.6.attn_q.weightQ4_K[8192 8192]
-
blk.6.attn_v.weightQ6_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ6_K[28672 8192]
-
blk.7.ffn_gate.weightQ4_K[8192 28672]
-
blk.7.ffn_up.weightQ4_K[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ4_K[8192 1024]
-
blk.7.attn_output.weightQ4_K[8192 8192]
-
blk.7.attn_q.weightQ4_K[8192 8192]
-
blk.7.attn_v.weightQ6_K[8192 1024]
-
blk.8.attn_k.weightQ4_K[8192 1024]
-
blk.8.attn_q.weightQ4_K[8192 8192]
-
blk.8.attn_v.weightQ6_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ6_K[28672 8192]
-
blk.8.ffn_gate.weightQ4_K[8192 28672]
-
blk.8.ffn_up.weightQ4_K[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_output.weightQ4_K[8192 8192]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ6_K[28672 8192]
-
blk.9.ffn_gate.weightQ4_K[8192 28672]
-
blk.9.ffn_up.weightQ4_K[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_K[8192 1024]
-
blk.9.attn_output.weightQ4_K[8192 8192]
-
blk.9.attn_q.weightQ4_K[8192 8192]
-
blk.9.attn_v.weightQ6_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ6_K[28672 8192]
-
blk.10.ffn_gate.weightQ4_K[8192 28672]
-
blk.10.ffn_up.weightQ4_K[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ4_K[8192 1024]
-
blk.10.attn_output.weightQ4_K[8192 8192]
-
blk.10.attn_q.weightQ4_K[8192 8192]
-
blk.10.attn_v.weightQ6_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ6_K[28672 8192]
-
blk.11.ffn_gate.weightQ4_K[8192 28672]
-
blk.11.ffn_up.weightQ4_K[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ4_K[8192 1024]
-
blk.11.attn_output.weightQ4_K[8192 8192]
-
blk.11.attn_q.weightQ4_K[8192 8192]
-
blk.11.attn_v.weightQ6_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ6_K[28672 8192]
-
blk.12.ffn_gate.weightQ4_K[8192 28672]
-
blk.12.ffn_up.weightQ4_K[8192 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.weightQ4_K[8192 1024]
-
blk.12.attn_output.weightQ4_K[8192 8192]
-
blk.12.attn_q.weightQ4_K[8192 8192]
-
blk.12.attn_v.weightQ6_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ6_K[28672 8192]
-
blk.13.ffn_gate.weightQ4_K[8192 28672]
-
blk.13.ffn_up.weightQ4_K[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightQ4_K[8192 1024]
-
blk.13.attn_output.weightQ4_K[8192 8192]
-
blk.13.attn_q.weightQ4_K[8192 8192]
-
blk.13.attn_v.weightQ6_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ6_K[28672 8192]
-
blk.14.ffn_gate.weightQ4_K[8192 28672]
-
blk.14.ffn_up.weightQ4_K[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_K[8192 1024]
-
blk.14.attn_output.weightQ4_K[8192 8192]
-
blk.14.attn_q.weightQ4_K[8192 8192]
-
blk.14.attn_v.weightQ6_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_K[28672 8192]
-
blk.15.ffn_gate.weightQ4_K[8192 28672]
-
blk.15.ffn_up.weightQ4_K[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ4_K[8192 1024]
-
blk.15.attn_output.weightQ4_K[8192 8192]
-
blk.15.attn_q.weightQ4_K[8192 8192]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.16.ffn_gate.weightQ4_K[8192 28672]
-
blk.16.attn_k.weightQ4_K[8192 1024]
-
blk.16.attn_output.weightQ4_K[8192 8192]
-
blk.16.attn_q.weightQ4_K[8192 8192]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_K[28672 8192]
-
blk.16.ffn_up.weightQ4_K[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ6_K[28672 8192]
-
blk.17.ffn_gate.weightQ4_K[8192 28672]
-
blk.17.ffn_up.weightQ4_K[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ4_K[8192 1024]
-
blk.17.attn_output.weightQ4_K[8192 8192]
-
blk.17.attn_q.weightQ4_K[8192 8192]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_K[28672 8192]
-
blk.18.ffn_gate.weightQ4_K[8192 28672]
-
blk.18.ffn_up.weightQ4_K[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.weightQ4_K[8192 1024]
-
blk.18.attn_output.weightQ4_K[8192 8192]
-
blk.18.attn_q.weightQ4_K[8192 8192]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.19.attn_k.weightQ4_K[8192 1024]
-
blk.19.attn_output.weightQ4_K[8192 8192]
-
blk.19.attn_q.weightQ4_K[8192 8192]
-
blk.19.attn_v.weightQ6_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ6_K[28672 8192]
-
blk.19.ffn_gate.weightQ4_K[8192 28672]
-
blk.19.ffn_up.weightQ4_K[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_K[28672 8192]
-
blk.20.ffn_gate.weightQ4_K[8192 28672]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_up.weightQ4_K[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ4_K[8192 1024]
-
blk.20.attn_output.weightQ4_K[8192 8192]
-
blk.20.attn_q.weightQ4_K[8192 8192]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ6_K[28672 8192]
-
blk.21.ffn_gate.weightQ4_K[8192 28672]
-
blk.21.ffn_up.weightQ4_K[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.weightQ4_K[8192 1024]
-
blk.21.attn_output.weightQ4_K[8192 8192]
-
blk.21.attn_q.weightQ4_K[8192 8192]
-
blk.21.attn_v.weightQ6_K[8192 1024]
-
blk.22.attn_k.weightQ4_K[8192 1024]
-
blk.22.attn_q.weightQ4_K[8192 8192]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_K[28672 8192]
-
blk.22.ffn_gate.weightQ4_K[8192 28672]
-
blk.22.ffn_up.weightQ4_K[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_output.weightQ4_K[8192 8192]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_K[28672 8192]
-
blk.23.ffn_gate.weightQ4_K[8192 28672]
-
blk.23.ffn_up.weightQ4_K[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_K[8192 1024]
-
blk.23.attn_output.weightQ4_K[8192 8192]
-
blk.23.attn_q.weightQ4_K[8192 8192]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_K[28672 8192]
-
blk.24.ffn_gate.weightQ4_K[8192 28672]
-
blk.24.ffn_up.weightQ4_K[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ4_K[8192 1024]
-
blk.24.attn_output.weightQ4_K[8192 8192]
-
blk.24.attn_q.weightQ4_K[8192 8192]
-
blk.24.attn_v.weightQ6_K[8192 1024]
-
blk.25.ffn_down.weightQ6_K[28672 8192]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_gate.weightQ4_K[8192 28672]
-
blk.25.ffn_up.weightQ4_K[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ4_K[8192 1024]
-
blk.25.attn_output.weightQ4_K[8192 8192]
-
blk.25.attn_q.weightQ4_K[8192 8192]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_K[28672 8192]
-
blk.26.ffn_gate.weightQ4_K[8192 28672]
-
blk.26.ffn_up.weightQ4_K[8192 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ4_K[8192 1024]
-
blk.26.attn_output.weightQ4_K[8192 8192]
-
blk.26.attn_q.weightQ4_K[8192 8192]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.27.ffn_gate.weightQ4_K[8192 28672]
-
blk.27.ffn_up.weightQ4_K[8192 28672]
-
blk.27.attn_k.weightQ4_K[8192 1024]
-
blk.27.attn_output.weightQ4_K[8192 8192]
-
blk.27.attn_q.weightQ4_K[8192 8192]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ6_K[28672 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_K[28672 8192]
-
blk.28.ffn_gate.weightQ4_K[8192 28672]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_up.weightQ4_K[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_K[8192 1024]
-
blk.28.attn_output.weightQ4_K[8192 8192]
-
blk.28.attn_q.weightQ4_K[8192 8192]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ6_K[28672 8192]
-
blk.29.ffn_gate.weightQ4_K[8192 28672]
-
blk.29.ffn_up.weightQ4_K[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ4_K[8192 1024]
-
blk.29.attn_output.weightQ4_K[8192 8192]
-
blk.29.attn_q.weightQ4_K[8192 8192]
-
blk.29.attn_v.weightQ6_K[8192 1024]
-
blk.30.ffn_gate.weightQ4_K[8192 28672]
-
blk.30.attn_k.weightQ4_K[8192 1024]
-
blk.30.attn_output.weightQ4_K[8192 8192]
-
blk.30.attn_q.weightQ4_K[8192 8192]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_K[28672 8192]
-
blk.30.ffn_up.weightQ4_K[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_K[28672 8192]
-
blk.31.ffn_gate.weightQ4_K[8192 28672]
-
blk.31.ffn_up.weightQ4_K[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ4_K[8192 1024]
-
blk.31.attn_output.weightQ4_K[8192 8192]
-
blk.31.attn_q.weightQ4_K[8192 8192]
-
blk.31.attn_v.weightQ6_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_K[28672 8192]
-
blk.32.ffn_gate.weightQ4_K[8192 28672]
-
blk.32.ffn_up.weightQ4_K[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ4_K[8192 1024]
-
blk.32.attn_output.weightQ4_K[8192 8192]
-
blk.32.attn_q.weightQ4_K[8192 8192]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.33.attn_k.weightQ4_K[8192 1024]
-
blk.33.attn_output.weightQ4_K[8192 8192]
-
blk.33.attn_q.weightQ4_K[8192 8192]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.33.ffn_down.weightQ4_K[28672 8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_gate.weightQ4_K[8192 28672]
-
blk.33.ffn_up.weightQ4_K[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ6_K[28672 8192]
-
blk.34.ffn_gate.weightQ4_K[8192 28672]
-
blk.34.ffn_up.weightQ4_K[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ4_K[8192 1024]
-
blk.34.attn_output.weightQ4_K[8192 8192]
-
blk.34.attn_q.weightQ4_K[8192 8192]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_K[28672 8192]
-
blk.35.ffn_gate.weightQ4_K[8192 28672]
-
blk.35.ffn_up.weightQ4_K[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ4_K[8192 1024]
-
blk.35.attn_output.weightQ4_K[8192 8192]
-
blk.35.attn_q.weightQ4_K[8192 8192]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.36.attn_k.weightQ4_K[8192 1024]
-
blk.36.attn_q.weightQ4_K[8192 8192]
-
blk.36.attn_v.weightQ6_K[8192 1024]
-
blk.36.ffn_down.weightQ4_K[28672 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_gate.weightQ4_K[8192 28672]
-
blk.36.ffn_up.weightQ4_K[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_output.weightQ4_K[8192 8192]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ6_K[28672 8192]
-
blk.37.ffn_gate.weightQ4_K[8192 28672]
-
blk.37.ffn_up.weightQ4_K[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ4_K[8192 1024]
-
blk.37.attn_output.weightQ4_K[8192 8192]
-
blk.37.attn_q.weightQ4_K[8192 8192]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_K[28672 8192]
-
blk.38.ffn_gate.weightQ4_K[8192 28672]
-
blk.38.ffn_up.weightQ4_K[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ4_K[8192 1024]
-
blk.38.attn_output.weightQ4_K[8192 8192]
-
blk.38.attn_q.weightQ4_K[8192 8192]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.39.ffn_down.weightQ4_K[28672 8192]
-
blk.39.ffn_gate.weightQ4_K[8192 28672]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_up.weightQ4_K[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_K[8192 1024]
-
blk.39.attn_output.weightQ4_K[8192 8192]
-
blk.39.attn_q.weightQ4_K[8192 8192]
-
blk.39.attn_v.weightQ6_K[8192 1024]
-
blk.40.ffn_down.weightQ4_K[28672 8192]
-
blk.40.ffn_gate.weightQ4_K[8192 28672]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_up.weightQ4_K[8192 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ4_K[8192 1024]
-
blk.40.attn_output.weightQ4_K[8192 8192]
-
blk.40.attn_q.weightQ4_K[8192 8192]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_K[28672 8192]
-
blk.41.ffn_gate.weightQ4_K[8192 28672]
-
blk.41.ffn_up.weightQ4_K[8192 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.weightQ4_K[8192 1024]
-
blk.41.attn_output.weightQ4_K[8192 8192]
-
blk.41.attn_q.weightQ4_K[8192 8192]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.42.attn_k.weightQ4_K[8192 1024]
-
blk.42.attn_q.weightQ4_K[8192 8192]
-
blk.42.attn_v.weightQ6_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_K[28672 8192]
-
blk.42.ffn_gate.weightQ4_K[8192 28672]
-
blk.42.ffn_up.weightQ4_K[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_output.weightQ4_K[8192 8192]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ6_K[28672 8192]
-
blk.43.ffn_gate.weightQ4_K[8192 28672]
-
blk.43.ffn_up.weightQ4_K[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ4_K[8192 1024]
-
blk.43.attn_output.weightQ4_K[8192 8192]
-
blk.43.attn_q.weightQ4_K[8192 8192]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_K[28672 8192]
-
blk.44.ffn_gate.weightQ4_K[8192 28672]
-
blk.44.ffn_up.weightQ4_K[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightQ4_K[8192 1024]
-
blk.44.attn_output.weightQ4_K[8192 8192]
-
blk.44.attn_q.weightQ4_K[8192 8192]
-
blk.44.attn_v.weightQ6_K[8192 1024]
-
blk.45.ffn_down.weightQ6_K[28672 8192]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_gate.weightQ4_K[8192 28672]
-
blk.45.ffn_up.weightQ4_K[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ4_K[8192 1024]
-
blk.45.attn_output.weightQ4_K[8192 8192]
-
blk.45.attn_q.weightQ4_K[8192 8192]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_K[28672 8192]
-
blk.46.ffn_gate.weightQ4_K[8192 28672]
-
blk.46.ffn_up.weightQ4_K[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ4_K[8192 1024]
-
blk.46.attn_output.weightQ4_K[8192 8192]
-
blk.46.attn_q.weightQ4_K[8192 8192]
-
blk.46.attn_v.weightQ6_K[8192 1024]
-
blk.47.ffn_gate.weightQ4_K[8192 28672]
-
blk.47.ffn_up.weightQ4_K[8192 28672]
-
blk.47.attn_k.weightQ4_K[8192 1024]
-
blk.47.attn_output.weightQ4_K[8192 8192]
-
blk.47.attn_q.weightQ4_K[8192 8192]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ6_K[28672 8192]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ4_K[28672 8192]
-
blk.48.ffn_gate.weightQ4_K[8192 28672]
-
blk.48.ffn_up.weightQ4_K[8192 28672]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightQ4_K[8192 1024]
-
blk.48.attn_output.weightQ4_K[8192 8192]
-
blk.48.attn_q.weightQ4_K[8192 8192]
-
blk.48.attn_v.weightQ6_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ4_K[28672 8192]
-
blk.49.ffn_gate.weightQ4_K[8192 28672]
-
blk.49.ffn_up.weightQ4_K[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.weightQ4_K[8192 1024]
-
blk.49.attn_output.weightQ4_K[8192 8192]
-
blk.49.attn_q.weightQ4_K[8192 8192]
-
blk.49.attn_v.weightQ6_K[8192 1024]
-
blk.50.ffn_gate.weightQ4_K[8192 28672]
-
blk.50.attn_k.weightQ4_K[8192 1024]
-
blk.50.attn_output.weightQ4_K[8192 8192]
-
blk.50.attn_q.weightQ4_K[8192 8192]
-
blk.50.attn_v.weightQ4_K[8192 1024]
-
blk.50.ffn_down.weightQ4_K[28672 8192]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_up.weightQ4_K[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ4_K[28672 8192]
-
blk.51.ffn_gate.weightQ4_K[8192 28672]
-
blk.51.ffn_up.weightQ4_K[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightQ4_K[8192 1024]
-
blk.51.attn_output.weightQ4_K[8192 8192]
-
blk.51.attn_q.weightQ4_K[8192 8192]
-
blk.51.attn_v.weightQ4_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ6_K[28672 8192]
-
blk.52.ffn_gate.weightQ4_K[8192 28672]
-
blk.52.ffn_up.weightQ4_K[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightQ4_K[8192 1024]
-
blk.52.attn_output.weightQ4_K[8192 8192]
-
blk.52.attn_q.weightQ4_K[8192 8192]
-
blk.52.attn_v.weightQ4_K[8192 1024]
-
blk.53.attn_k.weightQ4_K[8192 1024]
-
blk.53.attn_output.weightQ4_K[8192 8192]
-
blk.53.attn_q.weightQ4_K[8192 8192]
-
blk.53.attn_v.weightQ6_K[8192 1024]
-
blk.53.ffn_down.weightQ4_K[28672 8192]
-
blk.53.ffn_gate.weightQ4_K[8192 28672]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_up.weightQ4_K[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ6_K[28672 8192]
-
blk.54.ffn_gate.weightQ4_K[8192 28672]
-
blk.54.ffn_up.weightQ4_K[8192 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.weightQ4_K[8192 1024]
-
blk.54.attn_output.weightQ4_K[8192 8192]
-
blk.54.attn_q.weightQ4_K[8192 8192]
-
blk.54.attn_v.weightQ4_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ4_K[28672 8192]
-
blk.55.ffn_gate.weightQ4_K[8192 28672]
-
blk.55.ffn_up.weightQ4_K[8192 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.weightQ4_K[8192 1024]
-
blk.55.attn_output.weightQ4_K[8192 8192]
-
blk.55.attn_q.weightQ4_K[8192 8192]
-
blk.55.attn_v.weightQ4_K[8192 1024]
-
blk.56.attn_k.weightQ4_K[8192 1024]
-
blk.56.attn_q.weightQ4_K[8192 8192]
-
blk.56.attn_v.weightQ6_K[8192 1024]
-
blk.56.ffn_down.weightQ4_K[28672 8192]
-
blk.56.ffn_gate.weightQ4_K[8192 28672]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_up.weightQ4_K[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_output.weightQ4_K[8192 8192]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightQ6_K[28672 8192]
-
blk.57.ffn_gate.weightQ4_K[8192 28672]
-
blk.57.ffn_up.weightQ4_K[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.weightQ4_K[8192 1024]
-
blk.57.attn_output.weightQ4_K[8192 8192]
-
blk.57.attn_q.weightQ4_K[8192 8192]
-
blk.57.attn_v.weightQ6_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ4_K[28672 8192]
-
blk.58.ffn_gate.weightQ4_K[8192 28672]
-
blk.58.ffn_up.weightQ4_K[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.weightQ4_K[8192 1024]
-
blk.58.attn_output.weightQ4_K[8192 8192]
-
blk.58.attn_q.weightQ4_K[8192 8192]
-
blk.58.attn_v.weightQ4_K[8192 1024]
-
blk.59.ffn_down.weightQ6_K[28672 8192]
-
blk.59.ffn_gate.weightQ4_K[8192 28672]
-
blk.59.ffn_up.weightQ4_K[8192 28672]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightQ4_K[8192 1024]
-
blk.59.attn_output.weightQ4_K[8192 8192]
-
blk.59.attn_q.weightQ4_K[8192 8192]
-
blk.59.attn_v.weightQ4_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ4_K[28672 8192]
-
blk.60.ffn_gate.weightQ4_K[8192 28672]
-
blk.60.ffn_up.weightQ4_K[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.weightQ4_K[8192 1024]
-
blk.60.attn_output.weightQ4_K[8192 8192]
-
blk.60.attn_q.weightQ4_K[8192 8192]
-
blk.60.attn_v.weightQ4_K[8192 1024]
-
blk.61.ffn_gate.weightQ4_K[8192 28672]
-
blk.61.ffn_up.weightQ4_K[8192 28672]
-
blk.61.attn_k.weightQ4_K[8192 1024]
-
blk.61.attn_output.weightQ4_K[8192 8192]
-
blk.61.attn_q.weightQ4_K[8192 8192]
-
blk.61.attn_v.weightQ6_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ4_K[28672 8192]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ6_K[28672 8192]
-
blk.62.ffn_gate.weightQ4_K[8192 28672]
-
blk.62.ffn_up.weightQ4_K[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightQ4_K[8192 1024]
-
blk.62.attn_output.weightQ4_K[8192 8192]
-
blk.62.attn_q.weightQ4_K[8192 8192]
-
blk.62.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ4_K[28672 8192]
-
blk.63.ffn_gate.weightQ4_K[8192 28672]
-
blk.63.ffn_up.weightQ4_K[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.weightQ4_K[8192 1024]
-
blk.63.attn_output.weightQ4_K[8192 8192]
-
blk.63.attn_q.weightQ4_K[8192 8192]
-
blk.63.attn_v.weightQ6_K[8192 1024]
-
blk.64.ffn_gate.weightQ4_K[8192 28672]
-
blk.64.attn_k.weightQ4_K[8192 1024]
-
blk.64.attn_output.weightQ4_K[8192 8192]
-
blk.64.attn_q.weightQ4_K[8192 8192]
-
blk.64.attn_v.weightQ4_K[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ6_K[28672 8192]
-
blk.64.ffn_up.weightQ4_K[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ4_K[28672 8192]
-
blk.65.ffn_gate.weightQ4_K[8192 28672]
-
blk.65.ffn_up.weightQ4_K[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightQ4_K[8192 1024]
-
blk.65.attn_output.weightQ4_K[8192 8192]
-
blk.65.attn_q.weightQ4_K[8192 8192]
-
blk.65.attn_v.weightQ4_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ4_K[28672 8192]
-
blk.66.ffn_gate.weightQ4_K[8192 28672]
-
blk.66.ffn_up.weightQ4_K[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightQ4_K[8192 1024]
-
blk.66.attn_output.weightQ4_K[8192 8192]
-
blk.66.attn_q.weightQ4_K[8192 8192]
-
blk.66.attn_v.weightQ6_K[8192 1024]
-
blk.67.attn_k.weightQ4_K[8192 1024]
-
blk.67.attn_output.weightQ4_K[8192 8192]
-
blk.67.attn_q.weightQ4_K[8192 8192]
-
blk.67.attn_v.weightQ4_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ6_K[28672 8192]
-
blk.67.ffn_gate.weightQ4_K[8192 28672]
-
blk.67.ffn_up.weightQ4_K[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightQ4_K[28672 8192]
-
blk.68.ffn_gate.weightQ4_K[8192 28672]
-
blk.68.ffn_up.weightQ4_K[8192 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.weightQ4_K[8192 1024]
-
blk.68.attn_output.weightQ4_K[8192 8192]
-
blk.68.attn_q.weightQ4_K[8192 8192]
-
blk.68.attn_v.weightQ4_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ4_K[28672 8192]
-
blk.69.ffn_gate.weightQ4_K[8192 28672]
-
blk.69.ffn_up.weightQ4_K[8192 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.weightQ4_K[8192 1024]
-
blk.69.attn_output.weightQ4_K[8192 8192]
-
blk.69.attn_q.weightQ4_K[8192 8192]
-
blk.69.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_k.weightQ4_K[8192 1024]
-
blk.70.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_q.weightQ4_K[8192 8192]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ6_K[28672 8192]
-
blk.70.ffn_gate.weightQ4_K[8192 28672]
-
blk.70.ffn_up.weightQ4_K[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_output.weightQ4_K[8192 8192]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ4_K[28672 8192]
-
blk.71.ffn_gate.weightQ4_K[8192 28672]
-
blk.71.ffn_up.weightQ4_K[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.weightQ4_K[8192 1024]
-
blk.71.attn_output.weightQ4_K[8192 8192]
-
blk.71.attn_q.weightQ4_K[8192 8192]
-
blk.71.attn_v.weightQ4_K[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ4_K[28672 8192]
-
blk.72.ffn_gate.weightQ4_K[8192 28672]
-
blk.72.ffn_up.weightQ4_K[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.weightQ4_K[8192 1024]
-
blk.72.attn_output.weightQ4_K[8192 8192]
-
blk.72.attn_q.weightQ4_K[8192 8192]
-
blk.72.attn_v.weightQ6_K[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ6_K[28672 8192]
-
blk.73.ffn_gate.weightQ4_K[8192 28672]
-
blk.73.ffn_up.weightQ4_K[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightQ4_K[8192 1024]
-
blk.73.attn_output.weightQ4_K[8192 8192]
-
blk.73.attn_q.weightQ4_K[8192 8192]
-
blk.73.attn_v.weightQ6_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ4_K[28672 8192]
-
blk.74.ffn_gate.weightQ4_K[8192 28672]
-
blk.74.ffn_up.weightQ4_K[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.weightQ4_K[8192 1024]
-
blk.74.attn_output.weightQ4_K[8192 8192]
-
blk.74.attn_q.weightQ4_K[8192 8192]
-
blk.74.attn_v.weightQ4_K[8192 1024]
-
blk.75.ffn_gate.weightQ4_K[8192 28672]
-
blk.75.ffn_up.weightQ4_K[8192 28672]
-
blk.75.attn_k.weightQ4_K[8192 1024]
-
blk.75.attn_output.weightQ4_K[8192 8192]
-
blk.75.attn_q.weightQ4_K[8192 8192]
-
blk.75.attn_v.weightQ4_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ4_K[28672 8192]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ6_K[28672 8192]
-
blk.76.ffn_gate.weightQ4_K[8192 28672]
-
blk.76.ffn_up.weightQ4_K[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightQ4_K[8192 1024]
-
blk.76.attn_output.weightQ4_K[8192 8192]
-
blk.76.attn_q.weightQ4_K[8192 8192]
-
blk.76.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ4_K[28672 8192]
-
blk.77.ffn_gate.weightQ4_K[8192 28672]
-
blk.77.ffn_up.weightQ4_K[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.weightQ4_K[8192 1024]
-
blk.77.attn_output.weightQ4_K[8192 8192]
-
blk.77.attn_q.weightQ4_K[8192 8192]
-
blk.77.attn_v.weightQ4_K[8192 1024]
-
blk.78.ffn_gate.weightQ4_K[8192 28672]
-
blk.78.attn_k.weightQ4_K[8192 1024]
-
blk.78.attn_output.weightQ4_K[8192 8192]
-
blk.78.attn_q.weightQ4_K[8192 8192]
-
blk.78.attn_v.weightQ6_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightQ4_K[28672 8192]
-
blk.78.ffn_up.weightQ4_K[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ4_K[28672 8192]
-
blk.79.ffn_gate.weightQ4_K[8192 28672]
-
blk.79.ffn_up.weightQ4_K[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightQ4_K[8192 1024]
-
blk.79.attn_output.weightQ4_K[8192 8192]
-
blk.79.attn_q.weightQ4_K[8192 8192]
-
blk.79.attn_v.weightQ4_K[8192 1024]
-
blk.80.attn_norm.weightF32[8192]
-
blk.80.ffn_down.weightQ4_K[28672 8192]
-
blk.80.ffn_gate.weightQ4_K[8192 28672]
-
blk.80.ffn_up.weightQ4_K[8192 28672]
-
blk.80.ffn_norm.weightF32[8192]
-
blk.80.attn_k.weightQ4_K[8192 1024]
-
blk.80.attn_output.weightQ4_K[8192 8192]
-
blk.80.attn_q.weightQ4_K[8192 8192]
-
blk.80.attn_v.weightQ4_K[8192 1024]
-
blk.81.ffn_gate.weightQ4_K[8192 28672]
-
blk.81.ffn_up.weightQ4_K[8192 28672]
-
blk.81.attn_k.weightQ4_K[8192 1024]
-
blk.81.attn_output.weightQ4_K[8192 8192]
-
blk.81.attn_q.weightQ4_K[8192 8192]
-
blk.81.attn_v.weightQ4_K[8192 1024]
-
blk.81.ffn_down.weightQ4_K[28672 8192]
-
blk.81.attn_norm.weightF32[8192]
-
blk.81.ffn_norm.weightF32[8192]
-
blk.82.attn_norm.weightF32[8192]
-
blk.82.ffn_down.weightQ6_K[28672 8192]
-
blk.82.ffn_gate.weightQ4_K[8192 28672]
-
blk.82.ffn_up.weightQ4_K[8192 28672]
-
blk.82.ffn_norm.weightF32[8192]
-
blk.82.attn_k.weightQ4_K[8192 1024]
-
blk.82.attn_output.weightQ4_K[8192 8192]
-
blk.82.attn_q.weightQ4_K[8192 8192]
-
blk.82.attn_v.weightQ4_K[8192 1024]
-
blk.83.attn_norm.weightF32[8192]
-
blk.83.ffn_down.weightQ4_K[28672 8192]
-
blk.83.ffn_gate.weightQ4_K[8192 28672]
-
blk.83.ffn_up.weightQ4_K[8192 28672]
-
blk.83.ffn_norm.weightF32[8192]
-
blk.83.attn_k.weightQ4_K[8192 1024]
-
blk.83.attn_output.weightQ4_K[8192 8192]
-
blk.83.attn_q.weightQ4_K[8192 8192]
-
blk.83.attn_v.weightQ6_K[8192 1024]
-
blk.84.ffn_gate.weightQ4_K[8192 28672]
-
blk.84.attn_k.weightQ4_K[8192 1024]
-
blk.84.attn_output.weightQ4_K[8192 8192]
-
blk.84.attn_q.weightQ4_K[8192 8192]
-
blk.84.attn_v.weightQ4_K[8192 1024]
-
blk.84.attn_norm.weightF32[8192]
-
blk.84.ffn_down.weightQ6_K[28672 8192]
-
blk.84.ffn_up.weightQ4_K[8192 28672]
-
blk.84.ffn_norm.weightF32[8192]
-
blk.85.attn_norm.weightF32[8192]
-
blk.85.ffn_down.weightQ4_K[28672 8192]
-
blk.85.ffn_gate.weightQ4_K[8192 28672]
-
blk.85.ffn_up.weightQ4_K[8192 28672]
-
blk.85.ffn_norm.weightF32[8192]
-
blk.85.attn_k.weightQ4_K[8192 1024]
-
blk.85.attn_output.weightQ4_K[8192 8192]
-
blk.85.attn_q.weightQ4_K[8192 8192]
-
blk.85.attn_v.weightQ6_K[8192 1024]
-
blk.86.attn_norm.weightF32[8192]
-
blk.86.ffn_down.weightQ4_K[28672 8192]
-
blk.86.ffn_gate.weightQ4_K[8192 28672]
-
blk.86.ffn_up.weightQ4_K[8192 28672]
-
blk.86.ffn_norm.weightF32[8192]
-
blk.86.attn_k.weightQ4_K[8192 1024]
-
blk.86.attn_output.weightQ4_K[8192 8192]
-
blk.86.attn_q.weightQ4_K[8192 8192]
-
blk.86.attn_v.weightQ4_K[8192 1024]
-
blk.87.attn_k.weightQ4_K[8192 1024]
-
blk.87.attn_output.weightQ4_K[8192 8192]
-
blk.87.attn_q.weightQ4_K[8192 8192]
-
blk.87.attn_v.weightQ4_K[8192 1024]
-
blk.87.attn_norm.weightF32[8192]
-
blk.87.ffn_down.weightQ6_K[28672 8192]
-
blk.87.ffn_gate.weightQ4_K[8192 28672]
-
blk.87.ffn_up.weightQ4_K[8192 28672]
-
blk.87.ffn_norm.weightF32[8192]
-
blk.88.attn_norm.weightF32[8192]
-
blk.88.ffn_down.weightQ4_K[28672 8192]
-
blk.88.ffn_gate.weightQ4_K[8192 28672]
-
blk.88.ffn_up.weightQ4_K[8192 28672]
-
blk.88.ffn_norm.weightF32[8192]
-
blk.88.attn_k.weightQ4_K[8192 1024]
-
blk.88.attn_output.weightQ4_K[8192 8192]
-
blk.88.attn_q.weightQ4_K[8192 8192]
-
blk.88.attn_v.weightQ6_K[8192 1024]
-
blk.89.attn_norm.weightF32[8192]
-
blk.89.ffn_down.weightQ4_K[28672 8192]
-
blk.89.ffn_gate.weightQ4_K[8192 28672]
-
blk.89.ffn_up.weightQ4_K[8192 28672]
-
blk.89.ffn_norm.weightF32[8192]
-
blk.89.attn_k.weightQ4_K[8192 1024]
-
blk.89.attn_output.weightQ4_K[8192 8192]
-
blk.89.attn_q.weightQ4_K[8192 8192]
-
blk.89.attn_v.weightQ4_K[8192 1024]
-
blk.90.attn_k.weightQ4_K[8192 1024]
-
blk.90.attn_q.weightQ4_K[8192 8192]
-
blk.90.attn_v.weightQ6_K[8192 1024]
-
blk.90.attn_norm.weightF32[8192]
-
blk.90.ffn_down.weightQ6_K[28672 8192]
-
blk.90.ffn_gate.weightQ4_K[8192 28672]
-
blk.90.ffn_up.weightQ4_K[8192 28672]
-
blk.90.ffn_norm.weightF32[8192]
-
blk.90.attn_output.weightQ4_K[8192 8192]
-
blk.91.attn_norm.weightF32[8192]
-
blk.91.ffn_down.weightQ4_K[28672 8192]
-
blk.91.ffn_gate.weightQ4_K[8192 28672]
-
blk.91.ffn_up.weightQ4_K[8192 28672]
-
blk.91.ffn_norm.weightF32[8192]
-
blk.91.attn_k.weightQ4_K[8192 1024]
-
blk.91.attn_output.weightQ4_K[8192 8192]
-
blk.91.attn_q.weightQ4_K[8192 8192]
-
blk.91.attn_v.weightQ4_K[8192 1024]
-
blk.92.attn_norm.weightF32[8192]
-
blk.92.ffn_down.weightQ4_K[28672 8192]
-
blk.92.ffn_gate.weightQ4_K[8192 28672]
-
blk.92.ffn_up.weightQ4_K[8192 28672]
-
blk.92.ffn_norm.weightF32[8192]
-
blk.92.attn_k.weightQ4_K[8192 1024]
-
blk.92.attn_output.weightQ4_K[8192 8192]
-
blk.92.attn_q.weightQ4_K[8192 8192]
-
blk.92.attn_v.weightQ4_K[8192 1024]
-
blk.93.attn_norm.weightF32[8192]
-
blk.93.ffn_down.weightQ4_K[28672 8192]
-
blk.93.ffn_gate.weightQ4_K[8192 28672]
-
blk.93.ffn_up.weightQ4_K[8192 28672]
-
blk.93.ffn_norm.weightF32[8192]
-
blk.93.attn_k.weightQ4_K[8192 1024]
-
blk.93.attn_output.weightQ4_K[8192 8192]
-
blk.93.attn_q.weightQ4_K[8192 8192]
-
blk.93.attn_v.weightQ6_K[8192 1024]
-
blk.94.attn_norm.weightF32[8192]
-
blk.94.ffn_down.weightQ6_K[28672 8192]
-
blk.94.ffn_gate.weightQ4_K[8192 28672]
-
blk.94.ffn_up.weightQ4_K[8192 28672]
-
blk.94.ffn_norm.weightF32[8192]
-
blk.94.attn_k.weightQ4_K[8192 1024]
-
blk.94.attn_output.weightQ4_K[8192 8192]
-
blk.94.attn_q.weightQ4_K[8192 8192]
-
blk.94.attn_v.weightQ4_K[8192 1024]
-
blk.95.ffn_gate.weightQ4_K[8192 28672]
-
blk.95.ffn_up.weightQ4_K[8192 28672]
-
blk.95.attn_k.weightQ4_K[8192 1024]
-
blk.95.attn_output.weightQ4_K[8192 8192]
-
blk.95.attn_q.weightQ4_K[8192 8192]
-
blk.95.attn_v.weightQ4_K[8192 1024]
-
blk.95.attn_norm.weightF32[8192]
-
blk.95.ffn_down.weightQ4_K[28672 8192]
-
blk.95.ffn_norm.weightF32[8192]
-
blk.96.attn_norm.weightF32[8192]
-
blk.96.ffn_down.weightQ6_K[28672 8192]
-
blk.96.ffn_gate.weightQ4_K[8192 28672]
-
blk.96.ffn_up.weightQ4_K[8192 28672]
-
blk.96.ffn_norm.weightF32[8192]
-
blk.96.attn_k.weightQ4_K[8192 1024]
-
blk.96.attn_output.weightQ4_K[8192 8192]
-
blk.96.attn_q.weightQ4_K[8192 8192]
-
blk.96.attn_v.weightQ4_K[8192 1024]
-
blk.97.attn_norm.weightF32[8192]
-
blk.97.ffn_down.weightQ4_K[28672 8192]
-
blk.97.ffn_gate.weightQ4_K[8192 28672]
-
blk.97.ffn_up.weightQ4_K[8192 28672]
-
blk.97.ffn_norm.weightF32[8192]
-
blk.97.attn_k.weightQ4_K[8192 1024]
-
blk.97.attn_output.weightQ4_K[8192 8192]
-
blk.97.attn_q.weightQ4_K[8192 8192]
-
blk.97.attn_v.weightQ4_K[8192 1024]
-
blk.98.ffn_gate.weightQ4_K[8192 28672]
-
blk.98.attn_k.weightQ4_K[8192 1024]
-
blk.98.attn_output.weightQ4_K[8192 8192]
-
blk.98.attn_q.weightQ4_K[8192 8192]
-
blk.98.attn_v.weightQ6_K[8192 1024]
-
blk.98.attn_norm.weightF32[8192]
-
blk.98.ffn_down.weightQ6_K[28672 8192]
-
blk.98.ffn_up.weightQ4_K[8192 28672]
-
blk.98.ffn_norm.weightF32[8192]
-
blk.99.attn_norm.weightF32[8192]
-
blk.99.ffn_down.weightQ4_K[28672 8192]
-
blk.99.ffn_gate.weightQ4_K[8192 28672]
-
blk.99.ffn_up.weightQ4_K[8192 28672]
-
blk.99.ffn_norm.weightF32[8192]
-
blk.99.attn_k.weightQ4_K[8192 1024]
-
blk.99.attn_output.weightQ4_K[8192 8192]
-
blk.99.attn_q.weightQ4_K[8192 8192]
-
blk.99.attn_v.weightQ6_K[8192 1024]
-
blk.100.ffn_down.weightQ4_K[28672 8192]
-
blk.100.attn_norm.weightF32[8192]
-
blk.100.ffn_gate.weightQ4_K[8192 28672]
-
blk.100.ffn_up.weightQ4_K[8192 28672]
-
blk.100.ffn_norm.weightF32[8192]
-
blk.100.attn_k.weightQ4_K[8192 1024]
-
blk.100.attn_output.weightQ4_K[8192 8192]
-
blk.100.attn_q.weightQ4_K[8192 8192]
-
blk.100.attn_v.weightQ4_K[8192 1024]
-
blk.101.attn_k.weightQ4_K[8192 1024]
-
blk.101.attn_output.weightQ4_K[8192 8192]
-
blk.101.attn_q.weightQ4_K[8192 8192]
-
blk.101.attn_v.weightQ6_K[8192 1024]
-
blk.101.attn_norm.weightF32[8192]
-
blk.101.ffn_down.weightQ4_K[28672 8192]
-
blk.101.ffn_gate.weightQ4_K[8192 28672]
-
blk.101.ffn_up.weightQ4_K[8192 28672]
-
blk.101.ffn_norm.weightF32[8192]
-
blk.102.ffn_down.weightQ4_K[28672 8192]
-
blk.102.ffn_gate.weightQ4_K[8192 28672]
-
blk.102.ffn_up.weightQ4_K[8192 28672]
-
blk.102.ffn_norm.weightF32[8192]
-
blk.102.attn_k.weightQ4_K[8192 1024]
-
blk.102.attn_output.weightQ4_K[8192 8192]
-
blk.102.attn_v.weightQ4_K[8192 1024]
-
blk.102.attn_norm.weightF32[8192]
-
blk.102.attn_q.weightQ4_K[8192 8192]
-
blk.103.attn_norm.weightF32[8192]
-
blk.103.ffn_down.weightQ6_K[28672 8192]
-
blk.103.ffn_gate.weightQ4_K[8192 28672]
-
blk.103.ffn_up.weightQ4_K[8192 28672]
-
blk.103.ffn_norm.weightF32[8192]
-
blk.103.attn_k.weightQ4_K[8192 1024]
-
blk.103.attn_output.weightQ4_K[8192 8192]
-
blk.103.attn_q.weightQ4_K[8192 8192]
-
blk.103.attn_v.weightQ6_K[8192 1024]
-
blk.104.attn_k.weightQ4_K[8192 1024]
-
blk.104.attn_q.weightQ4_K[8192 8192]
-
blk.104.attn_v.weightQ4_K[8192 1024]
-
blk.104.attn_norm.weightF32[8192]
-
blk.104.ffn_down.weightQ6_K[28672 8192]
-
blk.104.ffn_gate.weightQ4_K[8192 28672]
-
blk.104.ffn_up.weightQ4_K[8192 28672]
-
blk.104.ffn_norm.weightF32[8192]
-
blk.104.attn_output.weightQ4_K[8192 8192]
-
blk.105.attn_norm.weightF32[8192]
-
blk.105.ffn_down.weightQ6_K[28672 8192]
-
blk.105.ffn_gate.weightQ4_K[8192 28672]
-
blk.105.ffn_up.weightQ4_K[8192 28672]
-
blk.105.ffn_norm.weightF32[8192]
-
blk.105.attn_k.weightQ4_K[8192 1024]
-
blk.105.attn_output.weightQ4_K[8192 8192]
-
blk.105.attn_q.weightQ4_K[8192 8192]
-
blk.105.attn_v.weightQ6_K[8192 1024]
-
blk.106.attn_norm.weightF32[8192]
-
blk.106.ffn_down.weightQ6_K[28672 8192]
-
blk.106.ffn_gate.weightQ4_K[8192 28672]
-
blk.106.ffn_up.weightQ4_K[8192 28672]
-
blk.106.ffn_norm.weightF32[8192]
-
blk.106.attn_k.weightQ4_K[8192 1024]
-
blk.106.attn_output.weightQ4_K[8192 8192]
-
blk.106.attn_q.weightQ4_K[8192 8192]
-
blk.106.attn_v.weightQ6_K[8192 1024]
-
blk.107.ffn_down.weightQ6_K[28672 8192]
-
blk.107.attn_norm.weightF32[8192]
-
blk.107.ffn_gate.weightQ4_K[8192 28672]
-
blk.107.ffn_up.weightQ4_K[8192 28672]
-
blk.107.ffn_norm.weightF32[8192]
-
blk.107.attn_k.weightQ4_K[8192 1024]
-
blk.107.attn_output.weightQ4_K[8192 8192]
-
blk.107.attn_q.weightQ4_K[8192 8192]
-
blk.107.attn_v.weightQ6_K[8192 1024]
-
blk.108.attn_norm.weightF32[8192]
-
blk.108.ffn_down.weightQ6_K[28672 8192]
-
blk.108.ffn_gate.weightQ4_K[8192 28672]
-
blk.108.ffn_up.weightQ4_K[8192 28672]
-
blk.108.ffn_norm.weightF32[8192]
-
blk.108.attn_k.weightQ4_K[8192 1024]
-
blk.108.attn_output.weightQ4_K[8192 8192]
-
blk.108.attn_q.weightQ4_K[8192 8192]
-
blk.108.attn_v.weightQ6_K[8192 1024]
-
blk.109.ffn_gate.weightQ4_K[8192 28672]
-
blk.109.ffn_up.weightQ4_K[8192 28672]
-
blk.109.attn_k.weightQ4_K[8192 1024]
-
blk.109.attn_output.weightQ4_K[8192 8192]
-
blk.109.attn_q.weightQ4_K[8192 8192]
-
blk.109.attn_v.weightQ6_K[8192 1024]
-
blk.109.attn_norm.weightF32[8192]
-
blk.109.ffn_down.weightQ6_K[28672 8192]
-
blk.109.ffn_norm.weightF32[8192]
-
blk.110.attn_norm.weightF32[8192]
-
blk.110.ffn_down.weightQ6_K[28672 8192]
-
blk.110.ffn_gate.weightQ4_K[8192 28672]
-
blk.110.ffn_up.weightQ4_K[8192 28672]
-
blk.110.ffn_norm.weightF32[8192]
-
blk.110.attn_k.weightQ4_K[8192 1024]
-
blk.110.attn_output.weightQ4_K[8192 8192]
-
blk.110.attn_q.weightQ4_K[8192 8192]
-
blk.110.attn_v.weightQ6_K[8192 1024]
-
blk.111.attn_norm.weightF32[8192]
-
blk.111.ffn_down.weightQ6_K[28672 8192]
-
blk.111.ffn_gate.weightQ4_K[8192 28672]
-
blk.111.ffn_up.weightQ4_K[8192 28672]
-
blk.111.ffn_norm.weightF32[8192]
-
blk.111.attn_k.weightQ4_K[8192 1024]
-
blk.111.attn_output.weightQ4_K[8192 8192]
-
blk.111.attn_q.weightQ4_K[8192 8192]
-
blk.111.attn_v.weightQ6_K[8192 1024]
-
blk.112.ffn_gate.weightQ4_K[8192 28672]
-
blk.112.attn_k.weightQ4_K[8192 1024]
-
blk.112.attn_output.weightQ4_K[8192 8192]
-
blk.112.attn_q.weightQ4_K[8192 8192]
-
blk.112.attn_v.weightQ6_K[8192 1024]
-
blk.112.attn_norm.weightF32[8192]
-
blk.112.ffn_down.weightQ6_K[28672 8192]
-
blk.112.ffn_up.weightQ4_K[8192 28672]
-
blk.112.ffn_norm.weightF32[8192]
-
blk.113.attn_norm.weightF32[8192]
-
blk.113.ffn_down.weightQ6_K[28672 8192]
-
blk.113.ffn_gate.weightQ4_K[8192 28672]
-
blk.113.ffn_up.weightQ4_K[8192 28672]
-
blk.113.ffn_norm.weightF32[8192]
-
blk.113.attn_k.weightQ4_K[8192 1024]
-
blk.113.attn_output.weightQ4_K[8192 8192]
-
blk.113.attn_q.weightQ4_K[8192 8192]
-
blk.113.attn_v.weightQ6_K[8192 1024]
-
blk.114.attn_norm.weightF32[8192]
-
blk.114.ffn_down.weightQ6_K[28672 8192]
-
blk.114.ffn_gate.weightQ4_K[8192 28672]
-
blk.114.ffn_up.weightQ4_K[8192 28672]
-
blk.114.ffn_norm.weightF32[8192]
-
blk.114.attn_k.weightQ4_K[8192 1024]
-
blk.114.attn_output.weightQ4_K[8192 8192]
-
blk.114.attn_q.weightQ4_K[8192 8192]
-
blk.114.attn_v.weightQ6_K[8192 1024]
-
blk.115.attn_k.weightQ4_K[8192 1024]
-
blk.115.attn_output.weightQ4_K[8192 8192]
-
blk.115.attn_q.weightQ4_K[8192 8192]
-
blk.115.attn_v.weightQ6_K[8192 1024]
-
blk.115.attn_norm.weightF32[8192]
-
blk.115.ffn_down.weightQ6_K[28672 8192]
-
blk.115.ffn_gate.weightQ4_K[8192 28672]
-
blk.115.ffn_up.weightQ4_K[8192 28672]
-
blk.115.ffn_norm.weightF32[8192]
-
blk.116.attn_norm.weightF32[8192]
-
blk.116.ffn_down.weightQ6_K[28672 8192]
-
blk.116.ffn_gate.weightQ4_K[8192 28672]
-
blk.116.ffn_up.weightQ4_K[8192 28672]
-
blk.116.ffn_norm.weightF32[8192]
-
blk.116.attn_k.weightQ4_K[8192 1024]
-
blk.116.attn_output.weightQ4_K[8192 8192]
-
blk.116.attn_q.weightQ4_K[8192 8192]
-
blk.116.attn_v.weightQ6_K[8192 1024]
-
blk.117.attn_norm.weightF32[8192]
-
blk.117.ffn_down.weightQ6_K[28672 8192]
-
blk.117.ffn_gate.weightQ4_K[8192 28672]
-
blk.117.ffn_up.weightQ4_K[8192 28672]
-
blk.117.ffn_norm.weightF32[8192]
-
blk.117.attn_k.weightQ4_K[8192 1024]
-
blk.117.attn_output.weightQ4_K[8192 8192]
-
blk.117.attn_q.weightQ4_K[8192 8192]
-
blk.117.attn_v.weightQ6_K[8192 1024]
-
blk.118.attn_norm.weightF32[8192]
-
blk.118.ffn_down.weightQ6_K[28672 8192]
-
blk.118.ffn_gate.weightQ4_K[8192 28672]
-
blk.118.ffn_up.weightQ4_K[8192 28672]
-
blk.118.ffn_norm.weightF32[8192]
-
blk.118.attn_k.weightQ4_K[8192 1024]
-
blk.118.attn_output.weightQ4_K[8192 8192]
-
blk.118.attn_q.weightQ4_K[8192 8192]
-
blk.118.attn_v.weightQ6_K[8192 1024]
-
blk.119.attn_norm.weightF32[8192]
-
blk.119.ffn_down.weightQ6_K[28672 8192]
-
blk.119.ffn_gate.weightQ4_K[8192 28672]
-
blk.119.ffn_up.weightQ4_K[8192 28672]
-
blk.119.ffn_norm.weightF32[8192]
-
blk.119.attn_k.weightQ4_K[8192 1024]
-
blk.119.attn_output.weightQ4_K[8192 8192]
-
blk.119.attn_q.weightQ4_K[8192 8192]
-
blk.119.attn_v.weightQ6_K[8192 1024]
-
output.weightF16[8192 32000]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79
blk.80
blk.81
blk.82
blk.83
blk.84
blk.85
blk.86
blk.87
blk.88
blk.89
blk.90
blk.91
blk.92
blk.93
blk.94
blk.95
blk.96
blk.97
blk.98
blk.99
blk.100
blk.101
blk.102
blk.103
blk.104
blk.105
blk.106
blk.107
blk.108
blk.109
blk.110
blk.111
blk.112
blk.113
blk.114
blk.115
blk.116
blk.117
blk.118
blk.119