latest
5.0GB
9B
Updated 3 weeks ago
9f84320f13e3 · 5.0GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count32
-
llama.attention.head_count_kv4
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count48
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
llama.vocab_size64000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <|Human|> <|Assistant|> ...]
-
NameTypeShape
-
token_embd.weightQ4_0[4096 64000]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ4_0[11008 4096]
-
blk.0.ffn_gate.weightQ4_0[4096 11008]
-
blk.0.ffn_up.weightQ4_0[4096 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weightQ4_0[4096 512]
-
blk.0.attn_output.weightQ4_0[4096 4096]
-
blk.0.attn_q.weightQ4_0[4096 4096]
-
blk.0.attn_v.weightQ4_0[4096 512]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ4_0[11008 4096]
-
blk.1.ffn_gate.weightQ4_0[4096 11008]
-
blk.1.ffn_up.weightQ4_0[4096 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weightQ4_0[4096 512]
-
blk.1.attn_output.weightQ4_0[4096 4096]
-
blk.1.attn_q.weightQ4_0[4096 4096]
-
blk.1.attn_v.weightQ4_0[4096 512]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ4_0[11008 4096]
-
blk.2.ffn_gate.weightQ4_0[4096 11008]
-
blk.2.ffn_up.weightQ4_0[4096 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weightQ4_0[4096 512]
-
blk.2.attn_output.weightQ4_0[4096 4096]
-
blk.2.attn_q.weightQ4_0[4096 4096]
-
blk.2.attn_v.weightQ4_0[4096 512]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ4_0[11008 4096]
-
blk.3.ffn_gate.weightQ4_0[4096 11008]
-
blk.3.ffn_up.weightQ4_0[4096 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weightQ4_0[4096 512]
-
blk.3.attn_output.weightQ4_0[4096 4096]
-
blk.3.attn_q.weightQ4_0[4096 4096]
-
blk.3.attn_v.weightQ4_0[4096 512]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ4_0[11008 4096]
-
blk.4.ffn_gate.weightQ4_0[4096 11008]
-
blk.4.ffn_up.weightQ4_0[4096 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weightQ4_0[4096 512]
-
blk.4.attn_output.weightQ4_0[4096 4096]
-
blk.4.attn_q.weightQ4_0[4096 4096]
-
blk.4.attn_v.weightQ4_0[4096 512]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ4_0[11008 4096]
-
blk.5.ffn_gate.weightQ4_0[4096 11008]
-
blk.5.ffn_up.weightQ4_0[4096 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weightQ4_0[4096 512]
-
blk.5.attn_output.weightQ4_0[4096 4096]
-
blk.5.attn_q.weightQ4_0[4096 4096]
-
blk.5.attn_v.weightQ4_0[4096 512]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ4_0[11008 4096]
-
blk.6.ffn_gate.weightQ4_0[4096 11008]
-
blk.6.ffn_up.weightQ4_0[4096 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weightQ4_0[4096 512]
-
blk.6.attn_output.weightQ4_0[4096 4096]
-
blk.6.attn_q.weightQ4_0[4096 4096]
-
blk.6.attn_v.weightQ4_0[4096 512]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ4_0[11008 4096]
-
blk.7.ffn_gate.weightQ4_0[4096 11008]
-
blk.7.ffn_up.weightQ4_0[4096 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weightQ4_0[4096 512]
-
blk.7.attn_output.weightQ4_0[4096 4096]
-
blk.7.attn_q.weightQ4_0[4096 4096]
-
blk.7.attn_v.weightQ4_0[4096 512]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ4_0[11008 4096]
-
blk.8.ffn_gate.weightQ4_0[4096 11008]
-
blk.8.ffn_up.weightQ4_0[4096 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weightQ4_0[4096 512]
-
blk.8.attn_output.weightQ4_0[4096 4096]
-
blk.8.attn_q.weightQ4_0[4096 4096]
-
blk.8.attn_v.weightQ4_0[4096 512]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ4_0[11008 4096]
-
blk.9.ffn_gate.weightQ4_0[4096 11008]
-
blk.9.ffn_up.weightQ4_0[4096 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weightQ4_0[4096 512]
-
blk.9.attn_output.weightQ4_0[4096 4096]
-
blk.9.attn_q.weightQ4_0[4096 4096]
-
blk.9.attn_v.weightQ4_0[4096 512]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ4_0[11008 4096]
-
blk.10.ffn_gate.weightQ4_0[4096 11008]
-
blk.10.ffn_up.weightQ4_0[4096 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weightQ4_0[4096 512]
-
blk.10.attn_output.weightQ4_0[4096 4096]
-
blk.10.attn_q.weightQ4_0[4096 4096]
-
blk.10.attn_v.weightQ4_0[4096 512]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ4_0[11008 4096]
-
blk.11.ffn_gate.weightQ4_0[4096 11008]
-
blk.11.ffn_up.weightQ4_0[4096 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.attn_k.weightQ4_0[4096 512]
-
blk.11.attn_output.weightQ4_0[4096 4096]
-
blk.11.attn_q.weightQ4_0[4096 4096]
-
blk.11.attn_v.weightQ4_0[4096 512]
-
blk.12.ffn_gate.weightQ4_0[4096 11008]
-
blk.12.ffn_up.weightQ4_0[4096 11008]
-
blk.12.attn_k.weightQ4_0[4096 512]
-
blk.12.attn_output.weightQ4_0[4096 4096]
-
blk.12.attn_q.weightQ4_0[4096 4096]
-
blk.12.attn_v.weightQ4_0[4096 512]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ4_0[11008 4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ4_0[11008 4096]
-
blk.13.ffn_gate.weightQ4_0[4096 11008]
-
blk.13.ffn_up.weightQ4_0[4096 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weightQ4_0[4096 512]
-
blk.13.attn_output.weightQ4_0[4096 4096]
-
blk.13.attn_q.weightQ4_0[4096 4096]
-
blk.13.attn_v.weightQ4_0[4096 512]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ4_0[11008 4096]
-
blk.14.ffn_gate.weightQ4_0[4096 11008]
-
blk.14.ffn_up.weightQ4_0[4096 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weightQ4_0[4096 512]
-
blk.14.attn_output.weightQ4_0[4096 4096]
-
blk.14.attn_q.weightQ4_0[4096 4096]
-
blk.14.attn_v.weightQ4_0[4096 512]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ4_0[11008 4096]
-
blk.15.ffn_gate.weightQ4_0[4096 11008]
-
blk.15.ffn_up.weightQ4_0[4096 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weightQ4_0[4096 512]
-
blk.15.attn_output.weightQ4_0[4096 4096]
-
blk.15.attn_q.weightQ4_0[4096 4096]
-
blk.15.attn_v.weightQ4_0[4096 512]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ4_0[11008 4096]
-
blk.16.ffn_gate.weightQ4_0[4096 11008]
-
blk.16.ffn_up.weightQ4_0[4096 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weightQ4_0[4096 512]
-
blk.16.attn_output.weightQ4_0[4096 4096]
-
blk.16.attn_q.weightQ4_0[4096 4096]
-
blk.16.attn_v.weightQ4_0[4096 512]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ4_0[11008 4096]
-
blk.17.ffn_gate.weightQ4_0[4096 11008]
-
blk.17.ffn_up.weightQ4_0[4096 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weightQ4_0[4096 512]
-
blk.17.attn_output.weightQ4_0[4096 4096]
-
blk.17.attn_q.weightQ4_0[4096 4096]
-
blk.17.attn_v.weightQ4_0[4096 512]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ4_0[11008 4096]
-
blk.18.ffn_gate.weightQ4_0[4096 11008]
-
blk.18.ffn_up.weightQ4_0[4096 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weightQ4_0[4096 512]
-
blk.18.attn_output.weightQ4_0[4096 4096]
-
blk.18.attn_q.weightQ4_0[4096 4096]
-
blk.18.attn_v.weightQ4_0[4096 512]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ4_0[11008 4096]
-
blk.19.ffn_gate.weightQ4_0[4096 11008]
-
blk.19.ffn_up.weightQ4_0[4096 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weightQ4_0[4096 512]
-
blk.19.attn_output.weightQ4_0[4096 4096]
-
blk.19.attn_q.weightQ4_0[4096 4096]
-
blk.19.attn_v.weightQ4_0[4096 512]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ4_0[11008 4096]
-
blk.20.ffn_gate.weightQ4_0[4096 11008]
-
blk.20.ffn_up.weightQ4_0[4096 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weightQ4_0[4096 512]
-
blk.20.attn_output.weightQ4_0[4096 4096]
-
blk.20.attn_q.weightQ4_0[4096 4096]
-
blk.20.attn_v.weightQ4_0[4096 512]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ4_0[11008 4096]
-
blk.21.ffn_gate.weightQ4_0[4096 11008]
-
blk.21.ffn_up.weightQ4_0[4096 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weightQ4_0[4096 512]
-
blk.21.attn_output.weightQ4_0[4096 4096]
-
blk.21.attn_q.weightQ4_0[4096 4096]
-
blk.21.attn_v.weightQ4_0[4096 512]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ4_0[11008 4096]
-
blk.22.ffn_gate.weightQ4_0[4096 11008]
-
blk.22.ffn_up.weightQ4_0[4096 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weightQ4_0[4096 512]
-
blk.22.attn_output.weightQ4_0[4096 4096]
-
blk.22.attn_q.weightQ4_0[4096 4096]
-
blk.22.attn_v.weightQ4_0[4096 512]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ4_0[11008 4096]
-
blk.23.ffn_gate.weightQ4_0[4096 11008]
-
blk.23.ffn_up.weightQ4_0[4096 11008]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.attn_k.weightQ4_0[4096 512]
-
blk.23.attn_output.weightQ4_0[4096 4096]
-
blk.23.attn_q.weightQ4_0[4096 4096]
-
blk.23.attn_v.weightQ4_0[4096 512]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ4_0[11008 4096]
-
blk.24.ffn_gate.weightQ4_0[4096 11008]
-
blk.24.ffn_up.weightQ4_0[4096 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weightQ4_0[4096 512]
-
blk.24.attn_output.weightQ4_0[4096 4096]
-
blk.24.attn_q.weightQ4_0[4096 4096]
-
blk.24.attn_v.weightQ4_0[4096 512]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ4_0[11008 4096]
-
blk.25.ffn_gate.weightQ4_0[4096 11008]
-
blk.25.ffn_up.weightQ4_0[4096 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weightQ4_0[4096 512]
-
blk.25.attn_output.weightQ4_0[4096 4096]
-
blk.25.attn_q.weightQ4_0[4096 4096]
-
blk.25.attn_v.weightQ4_0[4096 512]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ4_0[11008 4096]
-
blk.26.ffn_gate.weightQ4_0[4096 11008]
-
blk.26.ffn_up.weightQ4_0[4096 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weightQ4_0[4096 512]
-
blk.26.attn_output.weightQ4_0[4096 4096]
-
blk.26.attn_q.weightQ4_0[4096 4096]
-
blk.26.attn_v.weightQ4_0[4096 512]
-
blk.27.attn_k.weightQ4_0[4096 512]
-
blk.27.attn_q.weightQ4_0[4096 4096]
-
blk.27.attn_v.weightQ4_0[4096 512]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ4_0[11008 4096]
-
blk.27.ffn_gate.weightQ4_0[4096 11008]
-
blk.27.ffn_up.weightQ4_0[4096 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_output.weightQ4_0[4096 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ4_0[11008 4096]
-
blk.28.ffn_gate.weightQ4_0[4096 11008]
-
blk.28.ffn_up.weightQ4_0[4096 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weightQ4_0[4096 512]
-
blk.28.attn_output.weightQ4_0[4096 4096]
-
blk.28.attn_q.weightQ4_0[4096 4096]
-
blk.28.attn_v.weightQ4_0[4096 512]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ4_0[11008 4096]
-
blk.29.ffn_gate.weightQ4_0[4096 11008]
-
blk.29.ffn_up.weightQ4_0[4096 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weightQ4_0[4096 512]
-
blk.29.attn_output.weightQ4_0[4096 4096]
-
blk.29.attn_q.weightQ4_0[4096 4096]
-
blk.29.attn_v.weightQ4_0[4096 512]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ4_0[11008 4096]
-
blk.30.ffn_gate.weightQ4_0[4096 11008]
-
blk.30.ffn_up.weightQ4_0[4096 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weightQ4_0[4096 512]
-
blk.30.attn_output.weightQ4_0[4096 4096]
-
blk.30.attn_q.weightQ4_0[4096 4096]
-
blk.30.attn_v.weightQ4_0[4096 512]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ4_0[11008 4096]
-
blk.31.ffn_gate.weightQ4_0[4096 11008]
-
blk.31.ffn_up.weightQ4_0[4096 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weightQ4_0[4096 512]
-
blk.31.attn_output.weightQ4_0[4096 4096]
-
blk.31.attn_q.weightQ4_0[4096 4096]
-
blk.31.attn_v.weightQ4_0[4096 512]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.ffn_down.weightQ4_0[11008 4096]
-
blk.32.ffn_gate.weightQ4_0[4096 11008]
-
blk.32.ffn_up.weightQ4_0[4096 11008]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.attn_k.weightQ4_0[4096 512]
-
blk.32.attn_output.weightQ4_0[4096 4096]
-
blk.32.attn_q.weightQ4_0[4096 4096]
-
blk.32.attn_v.weightQ4_0[4096 512]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.ffn_down.weightQ4_0[11008 4096]
-
blk.33.ffn_gate.weightQ4_0[4096 11008]
-
blk.33.ffn_up.weightQ4_0[4096 11008]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.attn_k.weightQ4_0[4096 512]
-
blk.33.attn_output.weightQ4_0[4096 4096]
-
blk.33.attn_q.weightQ4_0[4096 4096]
-
blk.33.attn_v.weightQ4_0[4096 512]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.ffn_down.weightQ4_0[11008 4096]
-
blk.34.ffn_gate.weightQ4_0[4096 11008]
-
blk.34.ffn_up.weightQ4_0[4096 11008]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.attn_k.weightQ4_0[4096 512]
-
blk.34.attn_output.weightQ4_0[4096 4096]
-
blk.34.attn_q.weightQ4_0[4096 4096]
-
blk.34.attn_v.weightQ4_0[4096 512]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.ffn_down.weightQ4_0[11008 4096]
-
blk.35.ffn_gate.weightQ4_0[4096 11008]
-
blk.35.ffn_up.weightQ4_0[4096 11008]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.attn_k.weightQ4_0[4096 512]
-
blk.35.attn_output.weightQ4_0[4096 4096]
-
blk.35.attn_q.weightQ4_0[4096 4096]
-
blk.35.attn_v.weightQ4_0[4096 512]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.ffn_down.weightQ4_0[11008 4096]
-
blk.36.ffn_gate.weightQ4_0[4096 11008]
-
blk.36.ffn_up.weightQ4_0[4096 11008]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.attn_k.weightQ4_0[4096 512]
-
blk.36.attn_output.weightQ4_0[4096 4096]
-
blk.36.attn_q.weightQ4_0[4096 4096]
-
blk.36.attn_v.weightQ4_0[4096 512]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.ffn_down.weightQ4_0[11008 4096]
-
blk.37.ffn_gate.weightQ4_0[4096 11008]
-
blk.37.ffn_up.weightQ4_0[4096 11008]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.attn_k.weightQ4_0[4096 512]
-
blk.37.attn_output.weightQ4_0[4096 4096]
-
blk.37.attn_q.weightQ4_0[4096 4096]
-
blk.37.attn_v.weightQ4_0[4096 512]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.ffn_down.weightQ4_0[11008 4096]
-
blk.38.ffn_gate.weightQ4_0[4096 11008]
-
blk.38.ffn_up.weightQ4_0[4096 11008]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.attn_k.weightQ4_0[4096 512]
-
blk.38.attn_output.weightQ4_0[4096 4096]
-
blk.38.attn_q.weightQ4_0[4096 4096]
-
blk.38.attn_v.weightQ4_0[4096 512]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.ffn_down.weightQ4_0[11008 4096]
-
blk.39.ffn_gate.weightQ4_0[4096 11008]
-
blk.39.ffn_up.weightQ4_0[4096 11008]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.attn_k.weightQ4_0[4096 512]
-
blk.39.attn_output.weightQ4_0[4096 4096]
-
blk.39.attn_q.weightQ4_0[4096 4096]
-
blk.39.attn_v.weightQ4_0[4096 512]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.ffn_down.weightQ4_0[11008 4096]
-
blk.40.ffn_gate.weightQ4_0[4096 11008]
-
blk.40.ffn_up.weightQ4_0[4096 11008]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.attn_k.weightQ4_0[4096 512]
-
blk.40.attn_output.weightQ4_0[4096 4096]
-
blk.40.attn_q.weightQ4_0[4096 4096]
-
blk.40.attn_v.weightQ4_0[4096 512]
-
blk.41.ffn_gate.weightQ4_0[4096 11008]
-
blk.41.attn_k.weightQ4_0[4096 512]
-
blk.41.attn_output.weightQ4_0[4096 4096]
-
blk.41.attn_q.weightQ4_0[4096 4096]
-
blk.41.attn_v.weightQ4_0[4096 512]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.ffn_down.weightQ4_0[11008 4096]
-
blk.41.ffn_up.weightQ4_0[4096 11008]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.ffn_down.weightQ4_0[11008 4096]
-
blk.42.ffn_gate.weightQ4_0[4096 11008]
-
blk.42.ffn_up.weightQ4_0[4096 11008]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.attn_k.weightQ4_0[4096 512]
-
blk.42.attn_output.weightQ4_0[4096 4096]
-
blk.42.attn_q.weightQ4_0[4096 4096]
-
blk.42.attn_v.weightQ4_0[4096 512]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.ffn_down.weightQ4_0[11008 4096]
-
blk.43.ffn_gate.weightQ4_0[4096 11008]
-
blk.43.ffn_up.weightQ4_0[4096 11008]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.attn_k.weightQ4_0[4096 512]
-
blk.43.attn_output.weightQ4_0[4096 4096]
-
blk.43.attn_q.weightQ4_0[4096 4096]
-
blk.43.attn_v.weightQ4_0[4096 512]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.ffn_down.weightQ4_0[11008 4096]
-
blk.44.ffn_gate.weightQ4_0[4096 11008]
-
blk.44.ffn_up.weightQ4_0[4096 11008]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.attn_k.weightQ4_0[4096 512]
-
blk.44.attn_output.weightQ4_0[4096 4096]
-
blk.44.attn_q.weightQ4_0[4096 4096]
-
blk.44.attn_v.weightQ4_0[4096 512]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.ffn_down.weightQ4_0[11008 4096]
-
blk.45.ffn_gate.weightQ4_0[4096 11008]
-
blk.45.ffn_up.weightQ4_0[4096 11008]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.attn_k.weightQ4_0[4096 512]
-
blk.45.attn_output.weightQ4_0[4096 4096]
-
blk.45.attn_q.weightQ4_0[4096 4096]
-
blk.45.attn_v.weightQ4_0[4096 512]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.ffn_down.weightQ4_0[11008 4096]
-
blk.46.ffn_gate.weightQ4_0[4096 11008]
-
blk.46.ffn_up.weightQ4_0[4096 11008]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.attn_k.weightQ4_0[4096 512]
-
blk.46.attn_output.weightQ4_0[4096 4096]
-
blk.46.attn_q.weightQ4_0[4096 4096]
-
blk.46.attn_v.weightQ4_0[4096 512]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.ffn_down.weightQ4_0[11008 4096]
-
blk.47.ffn_gate.weightQ4_0[4096 11008]
-
blk.47.ffn_up.weightQ4_0[4096 11008]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.attn_k.weightQ4_0[4096 512]
-
blk.47.attn_output.weightQ4_0[4096 4096]
-
blk.47.attn_q.weightQ4_0[4096 4096]
-
blk.47.attn_v.weightQ4_0[4096 512]
-
output.weightQ6_K[4096 64000]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47