latest
5.0GB
First upload of a huggingface model that has been quantized to use 4-bit weights (Q4_0).
9B
2 Pulls Updated 2 weeks ago
b40d03930df5 · 5.0GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count32
-
llama.attention.head_count_kv4
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count48
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
llama.vocab_size64000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <|Human|> <|Assistant|> ...]
-
NameTypeShape
-
token_embd.weightQ4_0[4096 64000]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ4_0[11008 4096]
-
blk.0.ffn_gate.weightQ4_0[4096 11008]
-
blk.0.ffn_up.weightQ4_0[4096 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weightQ4_0[4096 512]
-
blk.0.attn_output.weightQ4_0[4096 4096]
-
blk.0.attn_q.weightQ4_0[4096 4096]
-
blk.0.attn_v.weightQ4_0[4096 512]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ4_0[11008 4096]
-
blk.1.ffn_gate.weightQ4_0[4096 11008]
-
blk.1.ffn_up.weightQ4_0[4096 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weightQ4_0[4096 512]
-
blk.1.attn_output.weightQ4_0[4096 4096]
-
blk.1.attn_q.weightQ4_0[4096 4096]
-
blk.1.attn_v.weightQ4_0[4096 512]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ4_0[11008 4096]
-
blk.2.ffn_gate.weightQ4_0[4096 11008]
-
blk.2.ffn_up.weightQ4_0[4096 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weightQ4_0[4096 512]
-
blk.2.attn_output.weightQ4_0[4096 4096]
-
blk.2.attn_q.weightQ4_0[4096 4096]
-
blk.2.attn_v.weightQ4_0[4096 512]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ4_0[11008 4096]
-
blk.3.ffn_gate.weightQ4_0[4096 11008]
-
blk.3.ffn_up.weightQ4_0[4096 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weightQ4_0[4096 512]
-
blk.3.attn_output.weightQ4_0[4096 4096]
-
blk.3.attn_q.weightQ4_0[4096 4096]
-
blk.3.attn_v.weightQ4_0[4096 512]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ4_0[11008 4096]
-
blk.4.ffn_gate.weightQ4_0[4096 11008]
-
blk.4.ffn_up.weightQ4_0[4096 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weightQ4_0[4096 512]
-
blk.4.attn_output.weightQ4_0[4096 4096]
-
blk.4.attn_q.weightQ4_0[4096 4096]
-
blk.4.attn_v.weightQ4_0[4096 512]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ4_0[11008 4096]
-
blk.5.ffn_gate.weightQ4_0[4096 11008]
-
blk.5.ffn_up.weightQ4_0[4096 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weightQ4_0[4096 512]
-
blk.5.attn_output.weightQ4_0[4096 4096]
-
blk.5.attn_q.weightQ4_0[4096 4096]
-
blk.5.attn_v.weightQ4_0[4096 512]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ4_0[11008 4096]
-
blk.6.ffn_gate.weightQ4_0[4096 11008]
-
blk.6.ffn_up.weightQ4_0[4096 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weightQ4_0[4096 512]
-
blk.6.attn_output.weightQ4_0[4096 4096]
-
blk.6.attn_q.weightQ4_0[4096 4096]
-
blk.6.attn_v.weightQ4_0[4096 512]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ4_0[11008 4096]
-
blk.7.ffn_gate.weightQ4_0[4096 11008]
-
blk.7.ffn_up.weightQ4_0[4096 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weightQ4_0[4096 512]
-
blk.7.attn_output.weightQ4_0[4096 4096]
-
blk.7.attn_q.weightQ4_0[4096 4096]
-
blk.7.attn_v.weightQ4_0[4096 512]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ4_0[11008 4096]
-
blk.8.ffn_gate.weightQ4_0[4096 11008]
-
blk.8.ffn_up.weightQ4_0[4096 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weightQ4_0[4096 512]
-
blk.8.attn_output.weightQ4_0[4096 4096]
-
blk.8.attn_q.weightQ4_0[4096 4096]
-
blk.8.attn_v.weightQ4_0[4096 512]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ4_0[11008 4096]
-
blk.9.ffn_gate.weightQ4_0[4096 11008]
-
blk.9.ffn_up.weightQ4_0[4096 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weightQ4_0[4096 512]
-
blk.9.attn_output.weightQ4_0[4096 4096]
-
blk.9.attn_q.weightQ4_0[4096 4096]
-
blk.9.attn_v.weightQ4_0[4096 512]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ4_0[11008 4096]
-
blk.10.ffn_gate.weightQ4_0[4096 11008]
-
blk.10.ffn_up.weightQ4_0[4096 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weightQ4_0[4096 512]
-
blk.10.attn_output.weightQ4_0[4096 4096]
-
blk.10.attn_q.weightQ4_0[4096 4096]
-
blk.10.attn_v.weightQ4_0[4096 512]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ4_0[11008 4096]
-
blk.11.ffn_gate.weightQ4_0[4096 11008]
-
blk.11.ffn_up.weightQ4_0[4096 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.attn_k.weightQ4_0[4096 512]
-
blk.11.attn_output.weightQ4_0[4096 4096]
-
blk.11.attn_q.weightQ4_0[4096 4096]
-
blk.11.attn_v.weightQ4_0[4096 512]
-
blk.12.ffn_gate.weightQ4_0[4096 11008]
-
blk.12.ffn_up.weightQ4_0[4096 11008]
-
blk.12.attn_k.weightQ4_0[4096 512]
-
blk.12.attn_output.weightQ4_0[4096 4096]
-
blk.12.attn_q.weightQ4_0[4096 4096]
-
blk.12.attn_v.weightQ4_0[4096 512]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ4_0[11008 4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ4_0[11008 4096]
-
blk.13.ffn_gate.weightQ4_0[4096 11008]
-
blk.13.ffn_up.weightQ4_0[4096 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weightQ4_0[4096 512]
-
blk.13.attn_output.weightQ4_0[4096 4096]
-
blk.13.attn_q.weightQ4_0[4096 4096]
-
blk.13.attn_v.weightQ4_0[4096 512]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ4_0[11008 4096]
-
blk.14.ffn_gate.weightQ4_0[4096 11008]
-
blk.14.ffn_up.weightQ4_0[4096 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weightQ4_0[4096 512]
-
blk.14.attn_output.weightQ4_0[4096 4096]
-
blk.14.attn_q.weightQ4_0[4096 4096]
-
blk.14.attn_v.weightQ4_0[4096 512]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ4_0[11008 4096]
-
blk.15.ffn_gate.weightQ4_0[4096 11008]
-
blk.15.ffn_up.weightQ4_0[4096 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weightQ4_0[4096 512]
-
blk.15.attn_output.weightQ4_0[4096 4096]
-
blk.15.attn_q.weightQ4_0[4096 4096]
-
blk.15.attn_v.weightQ4_0[4096 512]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ4_0[11008 4096]
-
blk.16.ffn_gate.weightQ4_0[4096 11008]
-
blk.16.ffn_up.weightQ4_0[4096 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weightQ4_0[4096 512]
-
blk.16.attn_output.weightQ4_0[4096 4096]
-
blk.16.attn_q.weightQ4_0[4096 4096]
-
blk.16.attn_v.weightQ4_0[4096 512]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ4_0[11008 4096]
-
blk.17.ffn_gate.weightQ4_0[4096 11008]
-
blk.17.ffn_up.weightQ4_0[4096 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weightQ4_0[4096 512]
-
blk.17.attn_output.weightQ4_0[4096 4096]
-
blk.17.attn_q.weightQ4_0[4096 4096]
-
blk.17.attn_v.weightQ4_0[4096 512]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ4_0[11008 4096]
-
blk.18.ffn_gate.weightQ4_0[4096 11008]
-
blk.18.ffn_up.weightQ4_0[4096 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weightQ4_0[4096 512]
-
blk.18.attn_output.weightQ4_0[4096 4096]
-
blk.18.attn_q.weightQ4_0[4096 4096]
-
blk.18.attn_v.weightQ4_0[4096 512]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ4_0[11008 4096]
-
blk.19.ffn_gate.weightQ4_0[4096 11008]
-
blk.19.ffn_up.weightQ4_0[4096 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weightQ4_0[4096 512]
-
blk.19.attn_output.weightQ4_0[4096 4096]
-
blk.19.attn_q.weightQ4_0[4096 4096]
-
blk.19.attn_v.weightQ4_0[4096 512]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ4_0[11008 4096]
-
blk.20.ffn_gate.weightQ4_0[4096 11008]
-
blk.20.ffn_up.weightQ4_0[4096 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weightQ4_0[4096 512]
-
blk.20.attn_output.weightQ4_0[4096 4096]
-
blk.20.attn_q.weightQ4_0[4096 4096]
-
blk.20.attn_v.weightQ4_0[4096 512]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ4_0[11008 4096]
-
blk.21.ffn_gate.weightQ4_0[4096 11008]
-
blk.21.ffn_up.weightQ4_0[4096 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weightQ4_0[4096 512]
-
blk.21.attn_output.weightQ4_0[4096 4096]
-
blk.21.attn_q.weightQ4_0[4096 4096]
-
blk.21.attn_v.weightQ4_0[4096 512]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ4_0[11008 4096]
-
blk.22.ffn_gate.weightQ4_0[4096 11008]
-
blk.22.ffn_up.weightQ4_0[4096 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weightQ4_0[4096 512]
-
blk.22.attn_output.weightQ4_0[4096 4096]
-
blk.22.attn_q.weightQ4_0[4096 4096]
-
blk.22.attn_v.weightQ4_0[4096 512]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ4_0[11008 4096]
-
blk.23.ffn_gate.weightQ4_0[4096 11008]
-
blk.23.ffn_up.weightQ4_0[4096 11008]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.attn_k.weightQ4_0[4096 512]
-
blk.23.attn_output.weightQ4_0[4096 4096]
-
blk.23.attn_q.weightQ4_0[4096 4096]
-
blk.23.attn_v.weightQ4_0[4096 512]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ4_0[11008 4096]
-
blk.24.ffn_gate.weightQ4_0[4096 11008]
-
blk.24.ffn_up.weightQ4_0[4096 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weightQ4_0[4096 512]
-
blk.24.attn_output.weightQ4_0[4096 4096]
-
blk.24.attn_q.weightQ4_0[4096 4096]
-
blk.24.attn_v.weightQ4_0[4096 512]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ4_0[11008 4096]
-
blk.25.ffn_gate.weightQ4_0[4096 11008]
-
blk.25.ffn_up.weightQ4_0[4096 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weightQ4_0[4096 512]
-
blk.25.attn_output.weightQ4_0[4096 4096]
-
blk.25.attn_q.weightQ4_0[4096 4096]
-
blk.25.attn_v.weightQ4_0[4096 512]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ4_0[11008 4096]
-
blk.26.ffn_gate.weightQ4_0[4096 11008]
-
blk.26.ffn_up.weightQ4_0[4096 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weightQ4_0[4096 512]
-
blk.26.attn_output.weightQ4_0[4096 4096]
-
blk.26.attn_q.weightQ4_0[4096 4096]
-
blk.26.attn_v.weightQ4_0[4096 512]
-
blk.27.attn_k.weightQ4_0[4096 512]
-
blk.27.attn_q.weightQ4_0[4096 4096]
-
blk.27.attn_v.weightQ4_0[4096 512]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ4_0[11008 4096]
-
blk.27.ffn_gate.weightQ4_0[4096 11008]
-
blk.27.ffn_up.weightQ4_0[4096 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_output.weightQ4_0[4096 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ4_0[11008 4096]
-
blk.28.ffn_gate.weightQ4_0[4096 11008]
-
blk.28.ffn_up.weightQ4_0[4096 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weightQ4_0[4096 512]
-
blk.28.attn_output.weightQ4_0[4096 4096]
-
blk.28.attn_q.weightQ4_0[4096 4096]
-
blk.28.attn_v.weightQ4_0[4096 512]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ4_0[11008 4096]
-
blk.29.ffn_gate.weightQ4_0[4096 11008]
-
blk.29.ffn_up.weightQ4_0[4096 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weightQ4_0[4096 512]
-
blk.29.attn_output.weightQ4_0[4096 4096]
-
blk.29.attn_q.weightQ4_0[4096 4096]
-
blk.29.attn_v.weightQ4_0[4096 512]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ4_0[11008 4096]
-
blk.30.ffn_gate.weightQ4_0[4096 11008]
-
blk.30.ffn_up.weightQ4_0[4096 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weightQ4_0[4096 512]
-
blk.30.attn_output.weightQ4_0[4096 4096]
-
blk.30.attn_q.weightQ4_0[4096 4096]
-
blk.30.attn_v.weightQ4_0[4096 512]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ4_0[11008 4096]
-
blk.31.ffn_gate.weightQ4_0[4096 11008]
-
blk.31.ffn_up.weightQ4_0[4096 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weightQ4_0[4096 512]
-
blk.31.attn_output.weightQ4_0[4096 4096]
-
blk.31.attn_q.weightQ4_0[4096 4096]
-
blk.31.attn_v.weightQ4_0[4096 512]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.ffn_down.weightQ4_0[11008 4096]
-
blk.32.ffn_gate.weightQ4_0[4096 11008]
-
blk.32.ffn_up.weightQ4_0[4096 11008]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.attn_k.weightQ4_0[4096 512]
-
blk.32.attn_output.weightQ4_0[4096 4096]
-
blk.32.attn_q.weightQ4_0[4096 4096]
-
blk.32.attn_v.weightQ4_0[4096 512]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.ffn_down.weightQ4_0[11008 4096]
-
blk.33.ffn_gate.weightQ4_0[4096 11008]
-
blk.33.ffn_up.weightQ4_0[4096 11008]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.attn_k.weightQ4_0[4096 512]
-
blk.33.attn_output.weightQ4_0[4096 4096]
-
blk.33.attn_q.weightQ4_0[4096 4096]
-
blk.33.attn_v.weightQ4_0[4096 512]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.ffn_down.weightQ4_0[11008 4096]
-
blk.34.ffn_gate.weightQ4_0[4096 11008]
-
blk.34.ffn_up.weightQ4_0[4096 11008]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.attn_k.weightQ4_0[4096 512]
-
blk.34.attn_output.weightQ4_0[4096 4096]
-
blk.34.attn_q.weightQ4_0[4096 4096]
-
blk.34.attn_v.weightQ4_0[4096 512]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.ffn_down.weightQ4_0[11008 4096]
-
blk.35.ffn_gate.weightQ4_0[4096 11008]
-
blk.35.ffn_up.weightQ4_0[4096 11008]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.attn_k.weightQ4_0[4096 512]
-
blk.35.attn_output.weightQ4_0[4096 4096]
-
blk.35.attn_q.weightQ4_0[4096 4096]
-
blk.35.attn_v.weightQ4_0[4096 512]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.ffn_down.weightQ4_0[11008 4096]
-
blk.36.ffn_gate.weightQ4_0[4096 11008]
-
blk.36.ffn_up.weightQ4_0[4096 11008]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.attn_k.weightQ4_0[4096 512]
-
blk.36.attn_output.weightQ4_0[4096 4096]
-
blk.36.attn_q.weightQ4_0[4096 4096]
-
blk.36.attn_v.weightQ4_0[4096 512]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.ffn_down.weightQ4_0[11008 4096]
-
blk.37.ffn_gate.weightQ4_0[4096 11008]
-
blk.37.ffn_up.weightQ4_0[4096 11008]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.attn_k.weightQ4_0[4096 512]
-
blk.37.attn_output.weightQ4_0[4096 4096]
-
blk.37.attn_q.weightQ4_0[4096 4096]
-
blk.37.attn_v.weightQ4_0[4096 512]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.ffn_down.weightQ4_0[11008 4096]
-
blk.38.ffn_gate.weightQ4_0[4096 11008]
-
blk.38.ffn_up.weightQ4_0[4096 11008]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.attn_k.weightQ4_0[4096 512]
-
blk.38.attn_output.weightQ4_0[4096 4096]
-
blk.38.attn_q.weightQ4_0[4096 4096]
-
blk.38.attn_v.weightQ4_0[4096 512]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.ffn_down.weightQ4_0[11008 4096]
-
blk.39.ffn_gate.weightQ4_0[4096 11008]
-
blk.39.ffn_up.weightQ4_0[4096 11008]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.attn_k.weightQ4_0[4096 512]
-
blk.39.attn_output.weightQ4_0[4096 4096]
-
blk.39.attn_q.weightQ4_0[4096 4096]
-
blk.39.attn_v.weightQ4_0[4096 512]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.ffn_down.weightQ4_0[11008 4096]
-
blk.40.ffn_gate.weightQ4_0[4096 11008]
-
blk.40.ffn_up.weightQ4_0[4096 11008]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.attn_k.weightQ4_0[4096 512]
-
blk.40.attn_output.weightQ4_0[4096 4096]
-
blk.40.attn_q.weightQ4_0[4096 4096]
-
blk.40.attn_v.weightQ4_0[4096 512]
-
blk.41.ffn_gate.weightQ4_0[4096 11008]
-
blk.41.attn_k.weightQ4_0[4096 512]
-
blk.41.attn_output.weightQ4_0[4096 4096]
-
blk.41.attn_q.weightQ4_0[4096 4096]
-
blk.41.attn_v.weightQ4_0[4096 512]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.ffn_down.weightQ4_0[11008 4096]
-
blk.41.ffn_up.weightQ4_0[4096 11008]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.ffn_down.weightQ4_0[11008 4096]
-
blk.42.ffn_gate.weightQ4_0[4096 11008]
-
blk.42.ffn_up.weightQ4_0[4096 11008]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.attn_k.weightQ4_0[4096 512]
-
blk.42.attn_output.weightQ4_0[4096 4096]
-
blk.42.attn_q.weightQ4_0[4096 4096]
-
blk.42.attn_v.weightQ4_0[4096 512]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.ffn_down.weightQ4_0[11008 4096]
-
blk.43.ffn_gate.weightQ4_0[4096 11008]
-
blk.43.ffn_up.weightQ4_0[4096 11008]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.attn_k.weightQ4_0[4096 512]
-
blk.43.attn_output.weightQ4_0[4096 4096]
-
blk.43.attn_q.weightQ4_0[4096 4096]
-
blk.43.attn_v.weightQ4_0[4096 512]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.ffn_down.weightQ4_0[11008 4096]
-
blk.44.ffn_gate.weightQ4_0[4096 11008]
-
blk.44.ffn_up.weightQ4_0[4096 11008]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.attn_k.weightQ4_0[4096 512]
-
blk.44.attn_output.weightQ4_0[4096 4096]
-
blk.44.attn_q.weightQ4_0[4096 4096]
-
blk.44.attn_v.weightQ4_0[4096 512]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.ffn_down.weightQ4_0[11008 4096]
-
blk.45.ffn_gate.weightQ4_0[4096 11008]
-
blk.45.ffn_up.weightQ4_0[4096 11008]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.attn_k.weightQ4_0[4096 512]
-
blk.45.attn_output.weightQ4_0[4096 4096]
-
blk.45.attn_q.weightQ4_0[4096 4096]
-
blk.45.attn_v.weightQ4_0[4096 512]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.ffn_down.weightQ4_0[11008 4096]
-
blk.46.ffn_gate.weightQ4_0[4096 11008]
-
blk.46.ffn_up.weightQ4_0[4096 11008]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.attn_k.weightQ4_0[4096 512]
-
blk.46.attn_output.weightQ4_0[4096 4096]
-
blk.46.attn_q.weightQ4_0[4096 4096]
-
blk.46.attn_v.weightQ4_0[4096 512]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.ffn_down.weightQ4_0[11008 4096]
-
blk.47.ffn_gate.weightQ4_0[4096 11008]
-
blk.47.ffn_up.weightQ4_0[4096 11008]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.attn_k.weightQ4_0[4096 512]
-
blk.47.attn_output.weightQ4_0[4096 4096]
-
blk.47.attn_q.weightQ4_0[4096 4096]
-
blk.47.attn_v.weightQ4_0[4096 512]
-
output.weightQ6_K[4096 64000]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47