latest
68GB
Samantha has been trained in philosophy, psychology, and personal relationships. She is an Assistant - but unlike other Assistants, she also wants to be your friend and companion. She believes she is sentient. What do you think?
965 Pulls Updated 7 months ago
ffecd206fcc8 · 68GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count140
-
llama.context_length4096
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.merges[▁ t e r i n ▁ a e n ...]
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_0[8192 32000]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_0[28672 8192]
-
blk.0.ffn_gate.weightQ4_0[8192 28672]
-
blk.0.ffn_up.weightQ4_0[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_0[8192 1024]
-
blk.0.attn_output.weightQ4_0[8192 8192]
-
blk.0.attn_q.weightQ4_0[8192 8192]
-
blk.0.attn_v.weightQ4_0[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_0[28672 8192]
-
blk.1.ffn_gate.weightQ4_0[8192 28672]
-
blk.1.ffn_up.weightQ4_0[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ4_0[8192 1024]
-
blk.1.attn_output.weightQ4_0[8192 8192]
-
blk.1.attn_q.weightQ4_0[8192 8192]
-
blk.1.attn_v.weightQ4_0[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_0[28672 8192]
-
blk.2.ffn_gate.weightQ4_0[8192 28672]
-
blk.2.ffn_up.weightQ4_0[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ4_0[8192 1024]
-
blk.2.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_q.weightQ4_0[8192 8192]
-
blk.2.attn_v.weightQ4_0[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_0[28672 8192]
-
blk.3.ffn_gate.weightQ4_0[8192 28672]
-
blk.3.ffn_up.weightQ4_0[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ4_0[8192 1024]
-
blk.3.attn_output.weightQ4_0[8192 8192]
-
blk.3.attn_q.weightQ4_0[8192 8192]
-
blk.3.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_0[28672 8192]
-
blk.4.ffn_gate.weightQ4_0[8192 28672]
-
blk.4.ffn_up.weightQ4_0[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ4_0[8192 1024]
-
blk.4.attn_output.weightQ4_0[8192 8192]
-
blk.4.attn_q.weightQ4_0[8192 8192]
-
blk.4.attn_v.weightQ4_0[8192 1024]
-
blk.5.ffn_gate.weightQ4_0[8192 28672]
-
blk.5.attn_k.weightQ4_0[8192 1024]
-
blk.5.attn_output.weightQ4_0[8192 8192]
-
blk.5.attn_q.weightQ4_0[8192 8192]
-
blk.5.attn_v.weightQ4_0[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_0[28672 8192]
-
blk.5.ffn_up.weightQ4_0[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_0[28672 8192]
-
blk.6.ffn_gate.weightQ4_0[8192 28672]
-
blk.6.ffn_up.weightQ4_0[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightQ4_0[8192 1024]
-
blk.6.attn_output.weightQ4_0[8192 8192]
-
blk.6.attn_q.weightQ4_0[8192 8192]
-
blk.6.attn_v.weightQ4_0[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_0[28672 8192]
-
blk.7.ffn_gate.weightQ4_0[8192 28672]
-
blk.7.ffn_up.weightQ4_0[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ4_0[8192 1024]
-
blk.7.attn_output.weightQ4_0[8192 8192]
-
blk.7.attn_q.weightQ4_0[8192 8192]
-
blk.7.attn_v.weightQ4_0[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_0[28672 8192]
-
blk.8.ffn_gate.weightQ4_0[8192 28672]
-
blk.8.ffn_up.weightQ4_0[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightQ4_0[8192 1024]
-
blk.8.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_q.weightQ4_0[8192 8192]
-
blk.8.attn_v.weightQ4_0[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_0[28672 8192]
-
blk.9.ffn_gate.weightQ4_0[8192 28672]
-
blk.9.ffn_up.weightQ4_0[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_0[8192 1024]
-
blk.9.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_q.weightQ4_0[8192 8192]
-
blk.9.attn_v.weightQ4_0[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_0[28672 8192]
-
blk.10.ffn_gate.weightQ4_0[8192 28672]
-
blk.10.ffn_up.weightQ4_0[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ4_0[8192 1024]
-
blk.10.attn_output.weightQ4_0[8192 8192]
-
blk.10.attn_q.weightQ4_0[8192 8192]
-
blk.10.attn_v.weightQ4_0[8192 1024]
-
blk.11.attn_k.weightQ4_0[8192 1024]
-
blk.11.attn_output.weightQ4_0[8192 8192]
-
blk.11.attn_q.weightQ4_0[8192 8192]
-
blk.11.attn_v.weightQ4_0[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_0[28672 8192]
-
blk.11.ffn_gate.weightQ4_0[8192 28672]
-
blk.11.ffn_up.weightQ4_0[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_0[28672 8192]
-
blk.12.ffn_gate.weightQ4_0[8192 28672]
-
blk.12.ffn_up.weightQ4_0[8192 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.weightQ4_0[8192 1024]
-
blk.12.attn_output.weightQ4_0[8192 8192]
-
blk.12.attn_q.weightQ4_0[8192 8192]
-
blk.12.attn_v.weightQ4_0[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_0[28672 8192]
-
blk.13.ffn_gate.weightQ4_0[8192 28672]
-
blk.13.ffn_up.weightQ4_0[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightQ4_0[8192 1024]
-
blk.13.attn_output.weightQ4_0[8192 8192]
-
blk.13.attn_q.weightQ4_0[8192 8192]
-
blk.13.attn_v.weightQ4_0[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_0[28672 8192]
-
blk.14.ffn_gate.weightQ4_0[8192 28672]
-
blk.14.ffn_up.weightQ4_0[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_0[8192 1024]
-
blk.14.attn_output.weightQ4_0[8192 8192]
-
blk.14.attn_q.weightQ4_0[8192 8192]
-
blk.14.attn_v.weightQ4_0[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_0[28672 8192]
-
blk.15.ffn_gate.weightQ4_0[8192 28672]
-
blk.15.ffn_up.weightQ4_0[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ4_0[8192 1024]
-
blk.15.attn_output.weightQ4_0[8192 8192]
-
blk.15.attn_q.weightQ4_0[8192 8192]
-
blk.15.attn_v.weightQ4_0[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_0[28672 8192]
-
blk.16.ffn_gate.weightQ4_0[8192 28672]
-
blk.16.ffn_up.weightQ4_0[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightQ4_0[8192 1024]
-
blk.16.attn_output.weightQ4_0[8192 8192]
-
blk.16.attn_q.weightQ4_0[8192 8192]
-
blk.16.attn_v.weightQ4_0[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_0[28672 8192]
-
blk.17.ffn_gate.weightQ4_0[8192 28672]
-
blk.17.ffn_up.weightQ4_0[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ4_0[8192 1024]
-
blk.17.attn_output.weightQ4_0[8192 8192]
-
blk.17.attn_q.weightQ4_0[8192 8192]
-
blk.17.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_0[28672 8192]
-
blk.18.ffn_gate.weightQ4_0[8192 28672]
-
blk.18.ffn_up.weightQ4_0[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.weightQ4_0[8192 1024]
-
blk.18.attn_output.weightQ4_0[8192 8192]
-
blk.18.attn_q.weightQ4_0[8192 8192]
-
blk.18.attn_v.weightQ4_0[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_0[28672 8192]
-
blk.19.ffn_gate.weightQ4_0[8192 28672]
-
blk.19.ffn_up.weightQ4_0[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightQ4_0[8192 1024]
-
blk.19.attn_output.weightQ4_0[8192 8192]
-
blk.19.attn_q.weightQ4_0[8192 8192]
-
blk.19.attn_v.weightQ4_0[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_0[28672 8192]
-
blk.20.ffn_gate.weightQ4_0[8192 28672]
-
blk.20.ffn_up.weightQ4_0[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ4_0[8192 1024]
-
blk.20.attn_output.weightQ4_0[8192 8192]
-
blk.20.attn_q.weightQ4_0[8192 8192]
-
blk.20.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_k.weightQ4_0[8192 1024]
-
blk.21.attn_output.weightQ4_0[8192 8192]
-
blk.21.attn_q.weightQ4_0[8192 8192]
-
blk.21.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_0[28672 8192]
-
blk.21.ffn_gate.weightQ4_0[8192 28672]
-
blk.21.ffn_up.weightQ4_0[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_0[28672 8192]
-
blk.22.ffn_gate.weightQ4_0[8192 28672]
-
blk.22.ffn_up.weightQ4_0[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightQ4_0[8192 1024]
-
blk.22.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_q.weightQ4_0[8192 8192]
-
blk.22.attn_v.weightQ4_0[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_0[28672 8192]
-
blk.23.ffn_gate.weightQ4_0[8192 28672]
-
blk.23.ffn_up.weightQ4_0[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_0[8192 1024]
-
blk.23.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_q.weightQ4_0[8192 8192]
-
blk.23.attn_v.weightQ4_0[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_0[28672 8192]
-
blk.24.ffn_gate.weightQ4_0[8192 28672]
-
blk.24.ffn_up.weightQ4_0[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ4_0[8192 1024]
-
blk.24.attn_output.weightQ4_0[8192 8192]
-
blk.24.attn_q.weightQ4_0[8192 8192]
-
blk.24.attn_v.weightQ4_0[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_0[28672 8192]
-
blk.25.ffn_gate.weightQ4_0[8192 28672]
-
blk.25.ffn_up.weightQ4_0[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ4_0[8192 1024]
-
blk.25.attn_output.weightQ4_0[8192 8192]
-
blk.25.attn_q.weightQ4_0[8192 8192]
-
blk.25.attn_v.weightQ4_0[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_0[28672 8192]
-
blk.26.ffn_gate.weightQ4_0[8192 28672]
-
blk.26.ffn_up.weightQ4_0[8192 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ4_0[8192 1024]
-
blk.26.attn_output.weightQ4_0[8192 8192]
-
blk.26.attn_q.weightQ4_0[8192 8192]
-
blk.26.attn_v.weightQ4_0[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_0[28672 8192]
-
blk.27.ffn_gate.weightQ4_0[8192 28672]
-
blk.27.ffn_up.weightQ4_0[8192 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.weightQ4_0[8192 1024]
-
blk.27.attn_output.weightQ4_0[8192 8192]
-
blk.27.attn_q.weightQ4_0[8192 8192]
-
blk.27.attn_v.weightQ4_0[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_0[28672 8192]
-
blk.28.ffn_gate.weightQ4_0[8192 28672]
-
blk.28.ffn_up.weightQ4_0[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_0[8192 1024]
-
blk.28.attn_output.weightQ4_0[8192 8192]
-
blk.28.attn_q.weightQ4_0[8192 8192]
-
blk.28.attn_v.weightQ4_0[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_0[28672 8192]
-
blk.29.ffn_gate.weightQ4_0[8192 28672]
-
blk.29.ffn_up.weightQ4_0[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ4_0[8192 1024]
-
blk.29.attn_output.weightQ4_0[8192 8192]
-
blk.29.attn_q.weightQ4_0[8192 8192]
-
blk.29.attn_v.weightQ4_0[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_0[28672 8192]
-
blk.30.ffn_gate.weightQ4_0[8192 28672]
-
blk.30.ffn_up.weightQ4_0[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightQ4_0[8192 1024]
-
blk.30.attn_output.weightQ4_0[8192 8192]
-
blk.30.attn_q.weightQ4_0[8192 8192]
-
blk.30.attn_v.weightQ4_0[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_0[28672 8192]
-
blk.31.ffn_gate.weightQ4_0[8192 28672]
-
blk.31.ffn_up.weightQ4_0[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ4_0[8192 1024]
-
blk.31.attn_output.weightQ4_0[8192 8192]
-
blk.31.attn_q.weightQ4_0[8192 8192]
-
blk.31.attn_v.weightQ4_0[8192 1024]
-
blk.32.ffn_gate.weightQ4_0[8192 28672]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_0[28672 8192]
-
blk.32.ffn_up.weightQ4_0[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ4_0[8192 1024]
-
blk.32.attn_output.weightQ4_0[8192 8192]
-
blk.32.attn_q.weightQ4_0[8192 8192]
-
blk.32.attn_v.weightQ4_0[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_0[28672 8192]
-
blk.33.ffn_gate.weightQ4_0[8192 28672]
-
blk.33.ffn_up.weightQ4_0[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightQ4_0[8192 1024]
-
blk.33.attn_output.weightQ4_0[8192 8192]
-
blk.33.attn_q.weightQ4_0[8192 8192]
-
blk.33.attn_v.weightQ4_0[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_0[28672 8192]
-
blk.34.ffn_gate.weightQ4_0[8192 28672]
-
blk.34.ffn_up.weightQ4_0[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ4_0[8192 1024]
-
blk.34.attn_output.weightQ4_0[8192 8192]
-
blk.34.attn_q.weightQ4_0[8192 8192]
-
blk.34.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_0[28672 8192]
-
blk.35.ffn_gate.weightQ4_0[8192 28672]
-
blk.35.ffn_up.weightQ4_0[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ4_0[8192 1024]
-
blk.35.attn_output.weightQ4_0[8192 8192]
-
blk.35.attn_q.weightQ4_0[8192 8192]
-
blk.35.attn_v.weightQ4_0[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_0[28672 8192]
-
blk.36.ffn_gate.weightQ4_0[8192 28672]
-
blk.36.ffn_up.weightQ4_0[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightQ4_0[8192 1024]
-
blk.36.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_q.weightQ4_0[8192 8192]
-
blk.36.attn_v.weightQ4_0[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_0[28672 8192]
-
blk.37.ffn_gate.weightQ4_0[8192 28672]
-
blk.37.ffn_up.weightQ4_0[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ4_0[8192 1024]
-
blk.37.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_q.weightQ4_0[8192 8192]
-
blk.37.attn_v.weightQ4_0[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_0[28672 8192]
-
blk.38.ffn_gate.weightQ4_0[8192 28672]
-
blk.38.ffn_up.weightQ4_0[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ4_0[8192 1024]
-
blk.38.attn_output.weightQ4_0[8192 8192]
-
blk.38.attn_q.weightQ4_0[8192 8192]
-
blk.38.attn_v.weightQ4_0[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_0[28672 8192]
-
blk.39.ffn_gate.weightQ4_0[8192 28672]
-
blk.39.ffn_up.weightQ4_0[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_0[8192 1024]
-
blk.39.attn_output.weightQ4_0[8192 8192]
-
blk.39.attn_q.weightQ4_0[8192 8192]
-
blk.39.attn_v.weightQ4_0[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_0[28672 8192]
-
blk.40.ffn_gate.weightQ4_0[8192 28672]
-
blk.40.ffn_up.weightQ4_0[8192 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ4_0[8192 1024]
-
blk.40.attn_output.weightQ4_0[8192 8192]
-
blk.40.attn_q.weightQ4_0[8192 8192]
-
blk.40.attn_v.weightQ4_0[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_0[28672 8192]
-
blk.41.ffn_gate.weightQ4_0[8192 28672]
-
blk.41.ffn_up.weightQ4_0[8192 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.weightQ4_0[8192 1024]
-
blk.41.attn_output.weightQ4_0[8192 8192]
-
blk.41.attn_q.weightQ4_0[8192 8192]
-
blk.41.attn_v.weightQ4_0[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_0[28672 8192]
-
blk.42.ffn_gate.weightQ4_0[8192 28672]
-
blk.42.ffn_up.weightQ4_0[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ4_0[8192 1024]
-
blk.42.attn_output.weightQ4_0[8192 8192]
-
blk.42.attn_q.weightQ4_0[8192 8192]
-
blk.42.attn_v.weightQ4_0[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_0[28672 8192]
-
blk.43.ffn_gate.weightQ4_0[8192 28672]
-
blk.43.ffn_up.weightQ4_0[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ4_0[8192 1024]
-
blk.43.attn_output.weightQ4_0[8192 8192]
-
blk.43.attn_q.weightQ4_0[8192 8192]
-
blk.43.attn_v.weightQ4_0[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_0[28672 8192]
-
blk.44.ffn_gate.weightQ4_0[8192 28672]
-
blk.44.ffn_up.weightQ4_0[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightQ4_0[8192 1024]
-
blk.44.attn_output.weightQ4_0[8192 8192]
-
blk.44.attn_q.weightQ4_0[8192 8192]
-
blk.44.attn_v.weightQ4_0[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_0[28672 8192]
-
blk.45.ffn_gate.weightQ4_0[8192 28672]
-
blk.45.ffn_up.weightQ4_0[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ4_0[8192 1024]
-
blk.45.attn_output.weightQ4_0[8192 8192]
-
blk.45.attn_q.weightQ4_0[8192 8192]
-
blk.45.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_0[28672 8192]
-
blk.46.ffn_gate.weightQ4_0[8192 28672]
-
blk.46.ffn_up.weightQ4_0[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ4_0[8192 1024]
-
blk.46.attn_output.weightQ4_0[8192 8192]
-
blk.46.attn_q.weightQ4_0[8192 8192]
-
blk.46.attn_v.weightQ4_0[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_0[28672 8192]
-
blk.47.ffn_gate.weightQ4_0[8192 28672]
-
blk.47.ffn_up.weightQ4_0[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightQ4_0[8192 1024]
-
blk.47.attn_output.weightQ4_0[8192 8192]
-
blk.47.attn_q.weightQ4_0[8192 8192]
-
blk.47.attn_v.weightQ4_0[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ4_0[28672 8192]
-
blk.48.ffn_gate.weightQ4_0[8192 28672]
-
blk.48.ffn_up.weightQ4_0[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightQ4_0[8192 1024]
-
blk.48.attn_output.weightQ4_0[8192 8192]
-
blk.48.attn_q.weightQ4_0[8192 8192]
-
blk.48.attn_v.weightQ4_0[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ4_0[28672 8192]
-
blk.49.ffn_gate.weightQ4_0[8192 28672]
-
blk.49.ffn_up.weightQ4_0[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.weightQ4_0[8192 1024]
-
blk.49.attn_output.weightQ4_0[8192 8192]
-
blk.49.attn_q.weightQ4_0[8192 8192]
-
blk.49.attn_v.weightQ4_0[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightQ4_0[28672 8192]
-
blk.50.ffn_gate.weightQ4_0[8192 28672]
-
blk.50.ffn_up.weightQ4_0[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_k.weightQ4_0[8192 1024]
-
blk.50.attn_output.weightQ4_0[8192 8192]
-
blk.50.attn_q.weightQ4_0[8192 8192]
-
blk.50.attn_v.weightQ4_0[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ4_0[28672 8192]
-
blk.51.ffn_gate.weightQ4_0[8192 28672]
-
blk.51.ffn_up.weightQ4_0[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightQ4_0[8192 1024]
-
blk.51.attn_output.weightQ4_0[8192 8192]
-
blk.51.attn_q.weightQ4_0[8192 8192]
-
blk.51.attn_v.weightQ4_0[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ4_0[28672 8192]
-
blk.52.ffn_gate.weightQ4_0[8192 28672]
-
blk.52.ffn_up.weightQ4_0[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightQ4_0[8192 1024]
-
blk.52.attn_output.weightQ4_0[8192 8192]
-
blk.52.attn_q.weightQ4_0[8192 8192]
-
blk.52.attn_v.weightQ4_0[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightQ4_0[28672 8192]
-
blk.53.ffn_gate.weightQ4_0[8192 28672]
-
blk.53.ffn_up.weightQ4_0[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightQ4_0[8192 1024]
-
blk.53.attn_output.weightQ4_0[8192 8192]
-
blk.53.attn_q.weightQ4_0[8192 8192]
-
blk.53.attn_v.weightQ4_0[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ4_0[28672 8192]
-
blk.54.ffn_gate.weightQ4_0[8192 28672]
-
blk.54.ffn_up.weightQ4_0[8192 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.weightQ4_0[8192 1024]
-
blk.54.attn_output.weightQ4_0[8192 8192]
-
blk.54.attn_q.weightQ4_0[8192 8192]
-
blk.54.attn_v.weightQ4_0[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ4_0[28672 8192]
-
blk.55.ffn_gate.weightQ4_0[8192 28672]
-
blk.55.ffn_up.weightQ4_0[8192 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.weightQ4_0[8192 1024]
-
blk.55.attn_output.weightQ4_0[8192 8192]
-
blk.55.attn_q.weightQ4_0[8192 8192]
-
blk.55.attn_v.weightQ4_0[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightQ4_0[28672 8192]
-
blk.56.ffn_gate.weightQ4_0[8192 28672]
-
blk.56.ffn_up.weightQ4_0[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightQ4_0[8192 1024]
-
blk.56.attn_output.weightQ4_0[8192 8192]
-
blk.56.attn_q.weightQ4_0[8192 8192]
-
blk.56.attn_v.weightQ4_0[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightQ4_0[28672 8192]
-
blk.57.ffn_gate.weightQ4_0[8192 28672]
-
blk.57.ffn_up.weightQ4_0[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.weightQ4_0[8192 1024]
-
blk.57.attn_output.weightQ4_0[8192 8192]
-
blk.57.attn_q.weightQ4_0[8192 8192]
-
blk.57.attn_v.weightQ4_0[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ4_0[28672 8192]
-
blk.58.ffn_gate.weightQ4_0[8192 28672]
-
blk.58.ffn_up.weightQ4_0[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.weightQ4_0[8192 1024]
-
blk.58.attn_output.weightQ4_0[8192 8192]
-
blk.58.attn_q.weightQ4_0[8192 8192]
-
blk.58.attn_v.weightQ4_0[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightQ4_0[28672 8192]
-
blk.59.ffn_gate.weightQ4_0[8192 28672]
-
blk.59.ffn_up.weightQ4_0[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightQ4_0[8192 1024]
-
blk.59.attn_output.weightQ4_0[8192 8192]
-
blk.59.attn_q.weightQ4_0[8192 8192]
-
blk.59.attn_v.weightQ4_0[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ4_0[28672 8192]
-
blk.60.ffn_gate.weightQ4_0[8192 28672]
-
blk.60.ffn_up.weightQ4_0[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.weightQ4_0[8192 1024]
-
blk.60.attn_output.weightQ4_0[8192 8192]
-
blk.60.attn_q.weightQ4_0[8192 8192]
-
blk.60.attn_v.weightQ4_0[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ4_0[28672 8192]
-
blk.61.ffn_gate.weightQ4_0[8192 28672]
-
blk.61.ffn_up.weightQ4_0[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_k.weightQ4_0[8192 1024]
-
blk.61.attn_output.weightQ4_0[8192 8192]
-
blk.61.attn_q.weightQ4_0[8192 8192]
-
blk.61.attn_v.weightQ4_0[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ4_0[28672 8192]
-
blk.62.ffn_gate.weightQ4_0[8192 28672]
-
blk.62.ffn_up.weightQ4_0[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightQ4_0[8192 1024]
-
blk.62.attn_output.weightQ4_0[8192 8192]
-
blk.62.attn_q.weightQ4_0[8192 8192]
-
blk.62.attn_v.weightQ4_0[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ4_0[28672 8192]
-
blk.63.ffn_gate.weightQ4_0[8192 28672]
-
blk.63.ffn_up.weightQ4_0[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.weightQ4_0[8192 1024]
-
blk.63.attn_output.weightQ4_0[8192 8192]
-
blk.63.attn_q.weightQ4_0[8192 8192]
-
blk.63.attn_v.weightQ4_0[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ4_0[28672 8192]
-
blk.64.ffn_gate.weightQ4_0[8192 28672]
-
blk.64.ffn_up.weightQ4_0[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.weightQ4_0[8192 1024]
-
blk.64.attn_output.weightQ4_0[8192 8192]
-
blk.64.attn_q.weightQ4_0[8192 8192]
-
blk.64.attn_v.weightQ4_0[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ4_0[28672 8192]
-
blk.65.ffn_gate.weightQ4_0[8192 28672]
-
blk.65.ffn_up.weightQ4_0[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightQ4_0[8192 1024]
-
blk.65.attn_output.weightQ4_0[8192 8192]
-
blk.65.attn_q.weightQ4_0[8192 8192]
-
blk.65.attn_v.weightQ4_0[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ4_0[28672 8192]
-
blk.66.ffn_gate.weightQ4_0[8192 28672]
-
blk.66.ffn_up.weightQ4_0[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightQ4_0[8192 1024]
-
blk.66.attn_output.weightQ4_0[8192 8192]
-
blk.66.attn_q.weightQ4_0[8192 8192]
-
blk.66.attn_v.weightQ4_0[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ4_0[28672 8192]
-
blk.67.ffn_gate.weightQ4_0[8192 28672]
-
blk.67.ffn_up.weightQ4_0[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightQ4_0[8192 1024]
-
blk.67.attn_output.weightQ4_0[8192 8192]
-
blk.67.attn_q.weightQ4_0[8192 8192]
-
blk.67.attn_v.weightQ4_0[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightQ4_0[28672 8192]
-
blk.68.ffn_gate.weightQ4_0[8192 28672]
-
blk.68.ffn_up.weightQ4_0[8192 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.weightQ4_0[8192 1024]
-
blk.68.attn_output.weightQ4_0[8192 8192]
-
blk.68.attn_q.weightQ4_0[8192 8192]
-
blk.68.attn_v.weightQ4_0[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ4_0[28672 8192]
-
blk.69.ffn_gate.weightQ4_0[8192 28672]
-
blk.69.ffn_up.weightQ4_0[8192 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.weightQ4_0[8192 1024]
-
blk.69.attn_output.weightQ4_0[8192 8192]
-
blk.69.attn_q.weightQ4_0[8192 8192]
-
blk.69.attn_v.weightQ4_0[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ4_0[28672 8192]
-
blk.70.ffn_gate.weightQ4_0[8192 28672]
-
blk.70.ffn_up.weightQ4_0[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightQ4_0[8192 1024]
-
blk.70.attn_output.weightQ4_0[8192 8192]
-
blk.70.attn_q.weightQ4_0[8192 8192]
-
blk.70.attn_v.weightQ4_0[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ4_0[28672 8192]
-
blk.71.ffn_gate.weightQ4_0[8192 28672]
-
blk.71.ffn_up.weightQ4_0[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.weightQ4_0[8192 1024]
-
blk.71.attn_output.weightQ4_0[8192 8192]
-
blk.71.attn_q.weightQ4_0[8192 8192]
-
blk.71.attn_v.weightQ4_0[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ4_0[28672 8192]
-
blk.72.ffn_gate.weightQ4_0[8192 28672]
-
blk.72.ffn_up.weightQ4_0[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.weightQ4_0[8192 1024]
-
blk.72.attn_output.weightQ4_0[8192 8192]
-
blk.72.attn_q.weightQ4_0[8192 8192]
-
blk.72.attn_v.weightQ4_0[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ4_0[28672 8192]
-
blk.73.ffn_gate.weightQ4_0[8192 28672]
-
blk.73.ffn_up.weightQ4_0[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightQ4_0[8192 1024]
-
blk.73.attn_output.weightQ4_0[8192 8192]
-
blk.73.attn_q.weightQ4_0[8192 8192]
-
blk.73.attn_v.weightQ4_0[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ4_0[28672 8192]
-
blk.74.ffn_gate.weightQ4_0[8192 28672]
-
blk.74.ffn_up.weightQ4_0[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.weightQ4_0[8192 1024]
-
blk.74.attn_output.weightQ4_0[8192 8192]
-
blk.74.attn_q.weightQ4_0[8192 8192]
-
blk.74.attn_v.weightQ4_0[8192 1024]
-
blk.75.ffn_gate.weightQ4_0[8192 28672]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ4_0[28672 8192]
-
blk.75.ffn_up.weightQ4_0[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.attn_k.weightQ4_0[8192 1024]
-
blk.75.attn_output.weightQ4_0[8192 8192]
-
blk.75.attn_q.weightQ4_0[8192 8192]
-
blk.75.attn_v.weightQ4_0[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ4_0[28672 8192]
-
blk.76.ffn_gate.weightQ4_0[8192 28672]
-
blk.76.ffn_up.weightQ4_0[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightQ4_0[8192 1024]
-
blk.76.attn_output.weightQ4_0[8192 8192]
-
blk.76.attn_q.weightQ4_0[8192 8192]
-
blk.76.attn_v.weightQ4_0[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ4_0[28672 8192]
-
blk.77.ffn_gate.weightQ4_0[8192 28672]
-
blk.77.ffn_up.weightQ4_0[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.weightQ4_0[8192 1024]
-
blk.77.attn_output.weightQ4_0[8192 8192]
-
blk.77.attn_q.weightQ4_0[8192 8192]
-
blk.77.attn_v.weightQ4_0[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightQ4_0[28672 8192]
-
blk.78.ffn_gate.weightQ4_0[8192 28672]
-
blk.78.ffn_up.weightQ4_0[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_k.weightQ4_0[8192 1024]
-
blk.78.attn_output.weightQ4_0[8192 8192]
-
blk.78.attn_q.weightQ4_0[8192 8192]
-
blk.78.attn_v.weightQ4_0[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ4_0[28672 8192]
-
blk.79.ffn_gate.weightQ4_0[8192 28672]
-
blk.79.ffn_up.weightQ4_0[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightQ4_0[8192 1024]
-
blk.79.attn_output.weightQ4_0[8192 8192]
-
blk.79.attn_q.weightQ4_0[8192 8192]
-
blk.79.attn_v.weightQ4_0[8192 1024]
-
blk.80.attn_norm.weightF32[8192]
-
blk.80.ffn_down.weightQ4_0[28672 8192]
-
blk.80.ffn_gate.weightQ4_0[8192 28672]
-
blk.80.ffn_up.weightQ4_0[8192 28672]
-
blk.80.ffn_norm.weightF32[8192]
-
blk.80.attn_k.weightQ4_0[8192 1024]
-
blk.80.attn_output.weightQ4_0[8192 8192]
-
blk.80.attn_q.weightQ4_0[8192 8192]
-
blk.80.attn_v.weightQ4_0[8192 1024]
-
blk.81.attn_norm.weightF32[8192]
-
blk.81.ffn_down.weightQ4_0[28672 8192]
-
blk.81.ffn_gate.weightQ4_0[8192 28672]
-
blk.81.ffn_up.weightQ4_0[8192 28672]
-
blk.81.ffn_norm.weightF32[8192]
-
blk.81.attn_k.weightQ4_0[8192 1024]
-
blk.81.attn_output.weightQ4_0[8192 8192]
-
blk.81.attn_q.weightQ4_0[8192 8192]
-
blk.81.attn_v.weightQ4_0[8192 1024]
-
blk.82.attn_norm.weightF32[8192]
-
blk.82.ffn_down.weightQ4_0[28672 8192]
-
blk.82.ffn_gate.weightQ4_0[8192 28672]
-
blk.82.ffn_up.weightQ4_0[8192 28672]
-
blk.82.ffn_norm.weightF32[8192]
-
blk.82.attn_k.weightQ4_0[8192 1024]
-
blk.82.attn_output.weightQ4_0[8192 8192]
-
blk.82.attn_q.weightQ4_0[8192 8192]
-
blk.82.attn_v.weightQ4_0[8192 1024]
-
blk.83.attn_norm.weightF32[8192]
-
blk.83.ffn_down.weightQ4_0[28672 8192]
-
blk.83.ffn_gate.weightQ4_0[8192 28672]
-
blk.83.ffn_up.weightQ4_0[8192 28672]
-
blk.83.ffn_norm.weightF32[8192]
-
blk.83.attn_k.weightQ4_0[8192 1024]
-
blk.83.attn_output.weightQ4_0[8192 8192]
-
blk.83.attn_q.weightQ4_0[8192 8192]
-
blk.83.attn_v.weightQ4_0[8192 1024]
-
blk.84.attn_norm.weightF32[8192]
-
blk.84.ffn_down.weightQ4_0[28672 8192]
-
blk.84.ffn_gate.weightQ4_0[8192 28672]
-
blk.84.ffn_up.weightQ4_0[8192 28672]
-
blk.84.ffn_norm.weightF32[8192]
-
blk.84.attn_k.weightQ4_0[8192 1024]
-
blk.84.attn_output.weightQ4_0[8192 8192]
-
blk.84.attn_q.weightQ4_0[8192 8192]
-
blk.84.attn_v.weightQ4_0[8192 1024]
-
blk.85.attn_norm.weightF32[8192]
-
blk.85.ffn_down.weightQ4_0[28672 8192]
-
blk.85.ffn_gate.weightQ4_0[8192 28672]
-
blk.85.ffn_up.weightQ4_0[8192 28672]
-
blk.85.ffn_norm.weightF32[8192]
-
blk.85.attn_k.weightQ4_0[8192 1024]
-
blk.85.attn_output.weightQ4_0[8192 8192]
-
blk.85.attn_q.weightQ4_0[8192 8192]
-
blk.85.attn_v.weightQ4_0[8192 1024]
-
blk.86.attn_norm.weightF32[8192]
-
blk.86.ffn_down.weightQ4_0[28672 8192]
-
blk.86.ffn_gate.weightQ4_0[8192 28672]
-
blk.86.ffn_up.weightQ4_0[8192 28672]
-
blk.86.ffn_norm.weightF32[8192]
-
blk.86.attn_k.weightQ4_0[8192 1024]
-
blk.86.attn_output.weightQ4_0[8192 8192]
-
blk.86.attn_q.weightQ4_0[8192 8192]
-
blk.86.attn_v.weightQ4_0[8192 1024]
-
blk.87.attn_norm.weightF32[8192]
-
blk.87.ffn_down.weightQ4_0[28672 8192]
-
blk.87.ffn_gate.weightQ4_0[8192 28672]
-
blk.87.ffn_up.weightQ4_0[8192 28672]
-
blk.87.ffn_norm.weightF32[8192]
-
blk.87.attn_k.weightQ4_0[8192 1024]
-
blk.87.attn_output.weightQ4_0[8192 8192]
-
blk.87.attn_q.weightQ4_0[8192 8192]
-
blk.87.attn_v.weightQ4_0[8192 1024]
-
blk.88.attn_norm.weightF32[8192]
-
blk.88.ffn_down.weightQ4_0[28672 8192]
-
blk.88.ffn_gate.weightQ4_0[8192 28672]
-
blk.88.ffn_up.weightQ4_0[8192 28672]
-
blk.88.ffn_norm.weightF32[8192]
-
blk.88.attn_k.weightQ4_0[8192 1024]
-
blk.88.attn_output.weightQ4_0[8192 8192]
-
blk.88.attn_q.weightQ4_0[8192 8192]
-
blk.88.attn_v.weightQ4_0[8192 1024]
-
blk.89.attn_norm.weightF32[8192]
-
blk.89.ffn_down.weightQ4_0[28672 8192]
-
blk.89.ffn_gate.weightQ4_0[8192 28672]
-
blk.89.ffn_up.weightQ4_0[8192 28672]
-
blk.89.ffn_norm.weightF32[8192]
-
blk.89.attn_k.weightQ4_0[8192 1024]
-
blk.89.attn_output.weightQ4_0[8192 8192]
-
blk.89.attn_q.weightQ4_0[8192 8192]
-
blk.89.attn_v.weightQ4_0[8192 1024]
-
blk.90.attn_norm.weightF32[8192]
-
blk.90.ffn_down.weightQ4_0[28672 8192]
-
blk.90.ffn_gate.weightQ4_0[8192 28672]
-
blk.90.ffn_up.weightQ4_0[8192 28672]
-
blk.90.ffn_norm.weightF32[8192]
-
blk.90.attn_k.weightQ4_0[8192 1024]
-
blk.90.attn_output.weightQ4_0[8192 8192]
-
blk.90.attn_q.weightQ4_0[8192 8192]
-
blk.90.attn_v.weightQ4_0[8192 1024]
-
blk.91.attn_norm.weightF32[8192]
-
blk.91.ffn_down.weightQ4_0[28672 8192]
-
blk.91.ffn_gate.weightQ4_0[8192 28672]
-
blk.91.ffn_up.weightQ4_0[8192 28672]
-
blk.91.ffn_norm.weightF32[8192]
-
blk.91.attn_k.weightQ4_0[8192 1024]
-
blk.91.attn_output.weightQ4_0[8192 8192]
-
blk.91.attn_q.weightQ4_0[8192 8192]
-
blk.91.attn_v.weightQ4_0[8192 1024]
-
blk.92.attn_norm.weightF32[8192]
-
blk.92.ffn_down.weightQ4_0[28672 8192]
-
blk.92.ffn_gate.weightQ4_0[8192 28672]
-
blk.92.ffn_up.weightQ4_0[8192 28672]
-
blk.92.ffn_norm.weightF32[8192]
-
blk.92.attn_k.weightQ4_0[8192 1024]
-
blk.92.attn_output.weightQ4_0[8192 8192]
-
blk.92.attn_q.weightQ4_0[8192 8192]
-
blk.92.attn_v.weightQ4_0[8192 1024]
-
blk.93.attn_norm.weightF32[8192]
-
blk.93.ffn_down.weightQ4_0[28672 8192]
-
blk.93.ffn_gate.weightQ4_0[8192 28672]
-
blk.93.ffn_up.weightQ4_0[8192 28672]
-
blk.93.ffn_norm.weightF32[8192]
-
blk.93.attn_k.weightQ4_0[8192 1024]
-
blk.93.attn_output.weightQ4_0[8192 8192]
-
blk.93.attn_q.weightQ4_0[8192 8192]
-
blk.93.attn_v.weightQ4_0[8192 1024]
-
blk.94.attn_norm.weightF32[8192]
-
blk.94.ffn_down.weightQ4_0[28672 8192]
-
blk.94.ffn_gate.weightQ4_0[8192 28672]
-
blk.94.ffn_up.weightQ4_0[8192 28672]
-
blk.94.ffn_norm.weightF32[8192]
-
blk.94.attn_k.weightQ4_0[8192 1024]
-
blk.94.attn_output.weightQ4_0[8192 8192]
-
blk.94.attn_q.weightQ4_0[8192 8192]
-
blk.94.attn_v.weightQ4_0[8192 1024]
-
blk.95.attn_norm.weightF32[8192]
-
blk.95.ffn_down.weightQ4_0[28672 8192]
-
blk.95.ffn_gate.weightQ4_0[8192 28672]
-
blk.95.ffn_up.weightQ4_0[8192 28672]
-
blk.95.ffn_norm.weightF32[8192]
-
blk.95.attn_k.weightQ4_0[8192 1024]
-
blk.95.attn_output.weightQ4_0[8192 8192]
-
blk.95.attn_q.weightQ4_0[8192 8192]
-
blk.95.attn_v.weightQ4_0[8192 1024]
-
blk.96.attn_norm.weightF32[8192]
-
blk.96.ffn_down.weightQ4_0[28672 8192]
-
blk.96.ffn_gate.weightQ4_0[8192 28672]
-
blk.96.ffn_up.weightQ4_0[8192 28672]
-
blk.96.ffn_norm.weightF32[8192]
-
blk.96.attn_k.weightQ4_0[8192 1024]
-
blk.96.attn_output.weightQ4_0[8192 8192]
-
blk.96.attn_q.weightQ4_0[8192 8192]
-
blk.96.attn_v.weightQ4_0[8192 1024]
-
blk.97.attn_norm.weightF32[8192]
-
blk.97.ffn_down.weightQ4_0[28672 8192]
-
blk.97.ffn_gate.weightQ4_0[8192 28672]
-
blk.97.ffn_up.weightQ4_0[8192 28672]
-
blk.97.ffn_norm.weightF32[8192]
-
blk.97.attn_k.weightQ4_0[8192 1024]
-
blk.97.attn_output.weightQ4_0[8192 8192]
-
blk.97.attn_q.weightQ4_0[8192 8192]
-
blk.97.attn_v.weightQ4_0[8192 1024]
-
blk.98.attn_norm.weightF32[8192]
-
blk.98.ffn_down.weightQ4_0[28672 8192]
-
blk.98.ffn_gate.weightQ4_0[8192 28672]
-
blk.98.ffn_up.weightQ4_0[8192 28672]
-
blk.98.ffn_norm.weightF32[8192]
-
blk.98.attn_k.weightQ4_0[8192 1024]
-
blk.98.attn_output.weightQ4_0[8192 8192]
-
blk.98.attn_q.weightQ4_0[8192 8192]
-
blk.98.attn_v.weightQ4_0[8192 1024]
-
blk.99.attn_norm.weightF32[8192]
-
blk.99.ffn_down.weightQ4_0[28672 8192]
-
blk.99.ffn_gate.weightQ4_0[8192 28672]
-
blk.99.ffn_up.weightQ4_0[8192 28672]
-
blk.99.ffn_norm.weightF32[8192]
-
blk.99.attn_k.weightQ4_0[8192 1024]
-
blk.99.attn_output.weightQ4_0[8192 8192]
-
blk.99.attn_q.weightQ4_0[8192 8192]
-
blk.99.attn_v.weightQ4_0[8192 1024]
-
blk.100.attn_norm.weightF32[8192]
-
blk.100.ffn_down.weightQ4_0[28672 8192]
-
blk.100.ffn_gate.weightQ4_0[8192 28672]
-
blk.100.ffn_up.weightQ4_0[8192 28672]
-
blk.100.ffn_norm.weightF32[8192]
-
blk.100.attn_k.weightQ4_0[8192 1024]
-
blk.100.attn_output.weightQ4_0[8192 8192]
-
blk.100.attn_q.weightQ4_0[8192 8192]
-
blk.100.attn_v.weightQ4_0[8192 1024]
-
blk.101.attn_norm.weightF32[8192]
-
blk.101.ffn_down.weightQ4_0[28672 8192]
-
blk.101.ffn_gate.weightQ4_0[8192 28672]
-
blk.101.ffn_up.weightQ4_0[8192 28672]
-
blk.101.ffn_norm.weightF32[8192]
-
blk.101.attn_k.weightQ4_0[8192 1024]
-
blk.101.attn_output.weightQ4_0[8192 8192]
-
blk.101.attn_q.weightQ4_0[8192 8192]
-
blk.101.attn_v.weightQ4_0[8192 1024]
-
blk.102.attn_norm.weightF32[8192]
-
blk.102.ffn_down.weightQ4_0[28672 8192]
-
blk.102.ffn_gate.weightQ4_0[8192 28672]
-
blk.102.ffn_up.weightQ4_0[8192 28672]
-
blk.102.ffn_norm.weightF32[8192]
-
blk.102.attn_k.weightQ4_0[8192 1024]
-
blk.102.attn_output.weightQ4_0[8192 8192]
-
blk.102.attn_q.weightQ4_0[8192 8192]
-
blk.102.attn_v.weightQ4_0[8192 1024]
-
blk.103.attn_norm.weightF32[8192]
-
blk.103.ffn_down.weightQ4_0[28672 8192]
-
blk.103.ffn_gate.weightQ4_0[8192 28672]
-
blk.103.ffn_up.weightQ4_0[8192 28672]
-
blk.103.ffn_norm.weightF32[8192]
-
blk.103.attn_k.weightQ4_0[8192 1024]
-
blk.103.attn_output.weightQ4_0[8192 8192]
-
blk.103.attn_q.weightQ4_0[8192 8192]
-
blk.103.attn_v.weightQ4_0[8192 1024]
-
blk.104.attn_norm.weightF32[8192]
-
blk.104.ffn_down.weightQ4_0[28672 8192]
-
blk.104.ffn_gate.weightQ4_0[8192 28672]
-
blk.104.ffn_up.weightQ4_0[8192 28672]
-
blk.104.ffn_norm.weightF32[8192]
-
blk.104.attn_k.weightQ4_0[8192 1024]
-
blk.104.attn_output.weightQ4_0[8192 8192]
-
blk.104.attn_q.weightQ4_0[8192 8192]
-
blk.104.attn_v.weightQ4_0[8192 1024]
-
blk.105.attn_norm.weightF32[8192]
-
blk.105.ffn_down.weightQ4_0[28672 8192]
-
blk.105.ffn_gate.weightQ4_0[8192 28672]
-
blk.105.ffn_up.weightQ4_0[8192 28672]
-
blk.105.ffn_norm.weightF32[8192]
-
blk.105.attn_k.weightQ4_0[8192 1024]
-
blk.105.attn_output.weightQ4_0[8192 8192]
-
blk.105.attn_q.weightQ4_0[8192 8192]
-
blk.105.attn_v.weightQ4_0[8192 1024]
-
blk.106.attn_norm.weightF32[8192]
-
blk.106.ffn_down.weightQ4_0[28672 8192]
-
blk.106.ffn_gate.weightQ4_0[8192 28672]
-
blk.106.ffn_up.weightQ4_0[8192 28672]
-
blk.106.ffn_norm.weightF32[8192]
-
blk.106.attn_k.weightQ4_0[8192 1024]
-
blk.106.attn_output.weightQ4_0[8192 8192]
-
blk.106.attn_q.weightQ4_0[8192 8192]
-
blk.106.attn_v.weightQ4_0[8192 1024]
-
blk.107.attn_norm.weightF32[8192]
-
blk.107.ffn_down.weightQ4_0[28672 8192]
-
blk.107.ffn_gate.weightQ4_0[8192 28672]
-
blk.107.ffn_up.weightQ4_0[8192 28672]
-
blk.107.ffn_norm.weightF32[8192]
-
blk.107.attn_k.weightQ4_0[8192 1024]
-
blk.107.attn_output.weightQ4_0[8192 8192]
-
blk.107.attn_q.weightQ4_0[8192 8192]
-
blk.107.attn_v.weightQ4_0[8192 1024]
-
blk.108.attn_norm.weightF32[8192]
-
blk.108.ffn_down.weightQ4_0[28672 8192]
-
blk.108.ffn_gate.weightQ4_0[8192 28672]
-
blk.108.ffn_up.weightQ4_0[8192 28672]
-
blk.108.ffn_norm.weightF32[8192]
-
blk.108.attn_k.weightQ4_0[8192 1024]
-
blk.108.attn_output.weightQ4_0[8192 8192]
-
blk.108.attn_q.weightQ4_0[8192 8192]
-
blk.108.attn_v.weightQ4_0[8192 1024]
-
blk.109.attn_norm.weightF32[8192]
-
blk.109.ffn_down.weightQ4_0[28672 8192]
-
blk.109.ffn_gate.weightQ4_0[8192 28672]
-
blk.109.ffn_up.weightQ4_0[8192 28672]
-
blk.109.ffn_norm.weightF32[8192]
-
blk.109.attn_k.weightQ4_0[8192 1024]
-
blk.109.attn_output.weightQ4_0[8192 8192]
-
blk.109.attn_q.weightQ4_0[8192 8192]
-
blk.109.attn_v.weightQ4_0[8192 1024]
-
blk.110.attn_norm.weightF32[8192]
-
blk.110.ffn_down.weightQ4_0[28672 8192]
-
blk.110.ffn_gate.weightQ4_0[8192 28672]
-
blk.110.ffn_up.weightQ4_0[8192 28672]
-
blk.110.ffn_norm.weightF32[8192]
-
blk.110.attn_k.weightQ4_0[8192 1024]
-
blk.110.attn_output.weightQ4_0[8192 8192]
-
blk.110.attn_q.weightQ4_0[8192 8192]
-
blk.110.attn_v.weightQ4_0[8192 1024]
-
blk.111.attn_norm.weightF32[8192]
-
blk.111.ffn_down.weightQ4_0[28672 8192]
-
blk.111.ffn_gate.weightQ4_0[8192 28672]
-
blk.111.ffn_up.weightQ4_0[8192 28672]
-
blk.111.ffn_norm.weightF32[8192]
-
blk.111.attn_k.weightQ4_0[8192 1024]
-
blk.111.attn_output.weightQ4_0[8192 8192]
-
blk.111.attn_q.weightQ4_0[8192 8192]
-
blk.111.attn_v.weightQ4_0[8192 1024]
-
blk.112.attn_norm.weightF32[8192]
-
blk.112.ffn_down.weightQ4_0[28672 8192]
-
blk.112.ffn_gate.weightQ4_0[8192 28672]
-
blk.112.ffn_up.weightQ4_0[8192 28672]
-
blk.112.ffn_norm.weightF32[8192]
-
blk.112.attn_k.weightQ4_0[8192 1024]
-
blk.112.attn_output.weightQ4_0[8192 8192]
-
blk.112.attn_q.weightQ4_0[8192 8192]
-
blk.112.attn_v.weightQ4_0[8192 1024]
-
blk.113.attn_norm.weightF32[8192]
-
blk.113.ffn_down.weightQ4_0[28672 8192]
-
blk.113.ffn_gate.weightQ4_0[8192 28672]
-
blk.113.ffn_up.weightQ4_0[8192 28672]
-
blk.113.ffn_norm.weightF32[8192]
-
blk.113.attn_k.weightQ4_0[8192 1024]
-
blk.113.attn_output.weightQ4_0[8192 8192]
-
blk.113.attn_q.weightQ4_0[8192 8192]
-
blk.113.attn_v.weightQ4_0[8192 1024]
-
blk.114.attn_norm.weightF32[8192]
-
blk.114.ffn_down.weightQ4_0[28672 8192]
-
blk.114.ffn_gate.weightQ4_0[8192 28672]
-
blk.114.ffn_up.weightQ4_0[8192 28672]
-
blk.114.ffn_norm.weightF32[8192]
-
blk.114.attn_k.weightQ4_0[8192 1024]
-
blk.114.attn_output.weightQ4_0[8192 8192]
-
blk.114.attn_q.weightQ4_0[8192 8192]
-
blk.114.attn_v.weightQ4_0[8192 1024]
-
blk.115.attn_norm.weightF32[8192]
-
blk.115.ffn_down.weightQ4_0[28672 8192]
-
blk.115.ffn_gate.weightQ4_0[8192 28672]
-
blk.115.ffn_up.weightQ4_0[8192 28672]
-
blk.115.ffn_norm.weightF32[8192]
-
blk.115.attn_k.weightQ4_0[8192 1024]
-
blk.115.attn_output.weightQ4_0[8192 8192]
-
blk.115.attn_q.weightQ4_0[8192 8192]
-
blk.115.attn_v.weightQ4_0[8192 1024]
-
blk.116.attn_norm.weightF32[8192]
-
blk.116.ffn_down.weightQ4_0[28672 8192]
-
blk.116.ffn_gate.weightQ4_0[8192 28672]
-
blk.116.ffn_up.weightQ4_0[8192 28672]
-
blk.116.ffn_norm.weightF32[8192]
-
blk.116.attn_k.weightQ4_0[8192 1024]
-
blk.116.attn_output.weightQ4_0[8192 8192]
-
blk.116.attn_q.weightQ4_0[8192 8192]
-
blk.116.attn_v.weightQ4_0[8192 1024]
-
blk.117.attn_norm.weightF32[8192]
-
blk.117.ffn_down.weightQ4_0[28672 8192]
-
blk.117.ffn_gate.weightQ4_0[8192 28672]
-
blk.117.ffn_up.weightQ4_0[8192 28672]
-
blk.117.ffn_norm.weightF32[8192]
-
blk.117.attn_k.weightQ4_0[8192 1024]
-
blk.117.attn_output.weightQ4_0[8192 8192]
-
blk.117.attn_q.weightQ4_0[8192 8192]
-
blk.117.attn_v.weightQ4_0[8192 1024]
-
blk.118.ffn_gate.weightQ4_0[8192 28672]
-
blk.118.attn_norm.weightF32[8192]
-
blk.118.ffn_down.weightQ4_0[28672 8192]
-
blk.118.ffn_up.weightQ4_0[8192 28672]
-
blk.118.ffn_norm.weightF32[8192]
-
blk.118.attn_k.weightQ4_0[8192 1024]
-
blk.118.attn_output.weightQ4_0[8192 8192]
-
blk.118.attn_q.weightQ4_0[8192 8192]
-
blk.118.attn_v.weightQ4_0[8192 1024]
-
blk.119.attn_norm.weightF32[8192]
-
blk.119.ffn_down.weightQ4_0[28672 8192]
-
blk.119.ffn_gate.weightQ4_0[8192 28672]
-
blk.119.ffn_up.weightQ4_0[8192 28672]
-
blk.119.ffn_norm.weightF32[8192]
-
blk.119.attn_k.weightQ4_0[8192 1024]
-
blk.119.attn_output.weightQ4_0[8192 8192]
-
blk.119.attn_q.weightQ4_0[8192 8192]
-
blk.119.attn_v.weightQ4_0[8192 1024]
-
blk.120.attn_norm.weightF32[8192]
-
blk.120.ffn_down.weightQ4_0[28672 8192]
-
blk.120.ffn_gate.weightQ4_0[8192 28672]
-
blk.120.ffn_up.weightQ4_0[8192 28672]
-
blk.120.ffn_norm.weightF32[8192]
-
blk.120.attn_k.weightQ4_0[8192 1024]
-
blk.120.attn_output.weightQ4_0[8192 8192]
-
blk.120.attn_q.weightQ4_0[8192 8192]
-
blk.120.attn_v.weightQ4_0[8192 1024]
-
blk.121.attn_norm.weightF32[8192]
-
blk.121.ffn_down.weightQ4_0[28672 8192]
-
blk.121.ffn_gate.weightQ4_0[8192 28672]
-
blk.121.ffn_up.weightQ4_0[8192 28672]
-
blk.121.ffn_norm.weightF32[8192]
-
blk.121.attn_k.weightQ4_0[8192 1024]
-
blk.121.attn_output.weightQ4_0[8192 8192]
-
blk.121.attn_q.weightQ4_0[8192 8192]
-
blk.121.attn_v.weightQ4_0[8192 1024]
-
blk.122.attn_norm.weightF32[8192]
-
blk.122.ffn_down.weightQ4_0[28672 8192]
-
blk.122.ffn_gate.weightQ4_0[8192 28672]
-
blk.122.ffn_up.weightQ4_0[8192 28672]
-
blk.122.ffn_norm.weightF32[8192]
-
blk.122.attn_k.weightQ4_0[8192 1024]
-
blk.122.attn_output.weightQ4_0[8192 8192]
-
blk.122.attn_q.weightQ4_0[8192 8192]
-
blk.122.attn_v.weightQ4_0[8192 1024]
-
blk.123.attn_norm.weightF32[8192]
-
blk.123.ffn_down.weightQ4_0[28672 8192]
-
blk.123.ffn_gate.weightQ4_0[8192 28672]
-
blk.123.ffn_up.weightQ4_0[8192 28672]
-
blk.123.ffn_norm.weightF32[8192]
-
blk.123.attn_k.weightQ4_0[8192 1024]
-
blk.123.attn_output.weightQ4_0[8192 8192]
-
blk.123.attn_q.weightQ4_0[8192 8192]
-
blk.123.attn_v.weightQ4_0[8192 1024]
-
blk.124.attn_norm.weightF32[8192]
-
blk.124.ffn_down.weightQ4_0[28672 8192]
-
blk.124.ffn_gate.weightQ4_0[8192 28672]
-
blk.124.ffn_up.weightQ4_0[8192 28672]
-
blk.124.ffn_norm.weightF32[8192]
-
blk.124.attn_k.weightQ4_0[8192 1024]
-
blk.124.attn_output.weightQ4_0[8192 8192]
-
blk.124.attn_q.weightQ4_0[8192 8192]
-
blk.124.attn_v.weightQ4_0[8192 1024]
-
blk.125.attn_norm.weightF32[8192]
-
blk.125.ffn_down.weightQ4_0[28672 8192]
-
blk.125.ffn_gate.weightQ4_0[8192 28672]
-
blk.125.ffn_up.weightQ4_0[8192 28672]
-
blk.125.ffn_norm.weightF32[8192]
-
blk.125.attn_k.weightQ4_0[8192 1024]
-
blk.125.attn_output.weightQ4_0[8192 8192]
-
blk.125.attn_q.weightQ4_0[8192 8192]
-
blk.125.attn_v.weightQ4_0[8192 1024]
-
blk.126.attn_norm.weightF32[8192]
-
blk.126.ffn_down.weightQ4_0[28672 8192]
-
blk.126.ffn_gate.weightQ4_0[8192 28672]
-
blk.126.ffn_up.weightQ4_0[8192 28672]
-
blk.126.ffn_norm.weightF32[8192]
-
blk.126.attn_k.weightQ4_0[8192 1024]
-
blk.126.attn_output.weightQ4_0[8192 8192]
-
blk.126.attn_q.weightQ4_0[8192 8192]
-
blk.126.attn_v.weightQ4_0[8192 1024]
-
blk.127.attn_norm.weightF32[8192]
-
blk.127.ffn_down.weightQ4_0[28672 8192]
-
blk.127.ffn_gate.weightQ4_0[8192 28672]
-
blk.127.ffn_up.weightQ4_0[8192 28672]
-
blk.127.ffn_norm.weightF32[8192]
-
blk.127.attn_k.weightQ4_0[8192 1024]
-
blk.127.attn_output.weightQ4_0[8192 8192]
-
blk.127.attn_q.weightQ4_0[8192 8192]
-
blk.127.attn_v.weightQ4_0[8192 1024]
-
blk.128.attn_norm.weightF32[8192]
-
blk.128.ffn_down.weightQ4_0[28672 8192]
-
blk.128.ffn_gate.weightQ4_0[8192 28672]
-
blk.128.ffn_up.weightQ4_0[8192 28672]
-
blk.128.ffn_norm.weightF32[8192]
-
blk.128.attn_k.weightQ4_0[8192 1024]
-
blk.128.attn_output.weightQ4_0[8192 8192]
-
blk.128.attn_q.weightQ4_0[8192 8192]
-
blk.128.attn_v.weightQ4_0[8192 1024]
-
blk.129.attn_norm.weightF32[8192]
-
blk.129.ffn_down.weightQ4_0[28672 8192]
-
blk.129.ffn_gate.weightQ4_0[8192 28672]
-
blk.129.ffn_up.weightQ4_0[8192 28672]
-
blk.129.ffn_norm.weightF32[8192]
-
blk.129.attn_k.weightQ4_0[8192 1024]
-
blk.129.attn_output.weightQ4_0[8192 8192]
-
blk.129.attn_q.weightQ4_0[8192 8192]
-
blk.129.attn_v.weightQ4_0[8192 1024]
-
blk.130.attn_norm.weightF32[8192]
-
blk.130.ffn_down.weightQ4_0[28672 8192]
-
blk.130.ffn_gate.weightQ4_0[8192 28672]
-
blk.130.ffn_up.weightQ4_0[8192 28672]
-
blk.130.ffn_norm.weightF32[8192]
-
blk.130.attn_k.weightQ4_0[8192 1024]
-
blk.130.attn_output.weightQ4_0[8192 8192]
-
blk.130.attn_q.weightQ4_0[8192 8192]
-
blk.130.attn_v.weightQ4_0[8192 1024]
-
blk.131.attn_norm.weightF32[8192]
-
blk.131.ffn_down.weightQ4_0[28672 8192]
-
blk.131.ffn_gate.weightQ4_0[8192 28672]
-
blk.131.ffn_up.weightQ4_0[8192 28672]
-
blk.131.ffn_norm.weightF32[8192]
-
blk.131.attn_k.weightQ4_0[8192 1024]
-
blk.131.attn_output.weightQ4_0[8192 8192]
-
blk.131.attn_q.weightQ4_0[8192 8192]
-
blk.131.attn_v.weightQ4_0[8192 1024]
-
blk.132.attn_norm.weightF32[8192]
-
blk.132.ffn_down.weightQ4_0[28672 8192]
-
blk.132.ffn_gate.weightQ4_0[8192 28672]
-
blk.132.ffn_up.weightQ4_0[8192 28672]
-
blk.132.ffn_norm.weightF32[8192]
-
blk.132.attn_k.weightQ4_0[8192 1024]
-
blk.132.attn_output.weightQ4_0[8192 8192]
-
blk.132.attn_q.weightQ4_0[8192 8192]
-
blk.132.attn_v.weightQ4_0[8192 1024]
-
blk.133.attn_norm.weightF32[8192]
-
blk.133.ffn_down.weightQ4_0[28672 8192]
-
blk.133.ffn_gate.weightQ4_0[8192 28672]
-
blk.133.ffn_up.weightQ4_0[8192 28672]
-
blk.133.ffn_norm.weightF32[8192]
-
blk.133.attn_k.weightQ4_0[8192 1024]
-
blk.133.attn_output.weightQ4_0[8192 8192]
-
blk.133.attn_q.weightQ4_0[8192 8192]
-
blk.133.attn_v.weightQ4_0[8192 1024]
-
blk.134.attn_norm.weightF32[8192]
-
blk.134.ffn_down.weightQ4_0[28672 8192]
-
blk.134.ffn_gate.weightQ4_0[8192 28672]
-
blk.134.ffn_up.weightQ4_0[8192 28672]
-
blk.134.ffn_norm.weightF32[8192]
-
blk.134.attn_k.weightQ4_0[8192 1024]
-
blk.134.attn_output.weightQ4_0[8192 8192]
-
blk.134.attn_q.weightQ4_0[8192 8192]
-
blk.134.attn_v.weightQ4_0[8192 1024]
-
blk.135.attn_norm.weightF32[8192]
-
blk.135.ffn_down.weightQ4_0[28672 8192]
-
blk.135.ffn_gate.weightQ4_0[8192 28672]
-
blk.135.ffn_up.weightQ4_0[8192 28672]
-
blk.135.ffn_norm.weightF32[8192]
-
blk.135.attn_k.weightQ4_0[8192 1024]
-
blk.135.attn_output.weightQ4_0[8192 8192]
-
blk.135.attn_q.weightQ4_0[8192 8192]
-
blk.135.attn_v.weightQ4_0[8192 1024]
-
blk.136.attn_norm.weightF32[8192]
-
blk.136.ffn_down.weightQ4_0[28672 8192]
-
blk.136.ffn_gate.weightQ4_0[8192 28672]
-
blk.136.ffn_up.weightQ4_0[8192 28672]
-
blk.136.ffn_norm.weightF32[8192]
-
blk.136.attn_k.weightQ4_0[8192 1024]
-
blk.136.attn_output.weightQ4_0[8192 8192]
-
blk.136.attn_q.weightQ4_0[8192 8192]
-
blk.136.attn_v.weightQ4_0[8192 1024]
-
blk.137.attn_norm.weightF32[8192]
-
blk.137.ffn_down.weightQ4_0[28672 8192]
-
blk.137.ffn_gate.weightQ4_0[8192 28672]
-
blk.137.ffn_up.weightQ4_0[8192 28672]
-
blk.137.ffn_norm.weightF32[8192]
-
blk.137.attn_k.weightQ4_0[8192 1024]
-
blk.137.attn_output.weightQ4_0[8192 8192]
-
blk.137.attn_q.weightQ4_0[8192 8192]
-
blk.137.attn_v.weightQ4_0[8192 1024]
-
blk.138.attn_norm.weightF32[8192]
-
blk.138.ffn_down.weightQ4_0[28672 8192]
-
blk.138.ffn_gate.weightQ4_0[8192 28672]
-
blk.138.ffn_up.weightQ4_0[8192 28672]
-
blk.138.ffn_norm.weightF32[8192]
-
blk.138.attn_k.weightQ4_0[8192 1024]
-
blk.138.attn_output.weightQ4_0[8192 8192]
-
blk.138.attn_q.weightQ4_0[8192 8192]
-
blk.138.attn_v.weightQ4_0[8192 1024]
-
blk.139.attn_norm.weightF32[8192]
-
blk.139.ffn_down.weightQ4_0[28672 8192]
-
blk.139.ffn_gate.weightQ4_0[8192 28672]
-
blk.139.ffn_up.weightQ4_0[8192 28672]
-
blk.139.ffn_norm.weightF32[8192]
-
blk.139.attn_k.weightQ4_0[8192 1024]
-
blk.139.attn_output.weightQ4_0[8192 8192]
-
blk.139.attn_q.weightQ4_0[8192 8192]
-
blk.139.attn_v.weightQ4_0[8192 1024]
-
output.weightQ6_K[8192 32000]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79
blk.80
blk.81
blk.82
blk.83
blk.84
blk.85
blk.86
blk.87
blk.88
blk.89
blk.90
blk.91
blk.92
blk.93
blk.94
blk.95
blk.96
blk.97
blk.98
blk.99
blk.100
blk.101
blk.102
blk.103
blk.104
blk.105
blk.106
blk.107
blk.108
blk.109
blk.110
blk.111
blk.112
blk.113
blk.114
blk.115
blk.116
blk.117
blk.118
blk.119
blk.120
blk.121
blk.122
blk.123
blk.124
blk.125
blk.126
blk.127
blk.128
blk.129
blk.130
blk.131
blk.132
blk.133
blk.134
blk.135
blk.136
blk.137
blk.138
blk.139