34b
20GB
Vision
34B
16 Pulls Updated 7 months ago
00c39c2649c0 · 19GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count60
-
llama.context_length4096
-
llama.embedding_length7168
-
llama.feed_forward_length20480
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id7
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <|Human|> <|Assistant|> ...]
-
NameTypeShape
-
token_embd.weightQ4_0[7168 64000]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_down.weightQ4_0[20480 7168]
-
blk.0.ffn_gate.weightQ4_0[7168 20480]
-
blk.0.ffn_up.weightQ4_0[7168 20480]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.0.attn_k.weightQ4_0[7168 1024]
-
blk.0.attn_output.weightQ4_0[7168 7168]
-
blk.0.attn_q.weightQ4_0[7168 7168]
-
blk.0.attn_v.weightQ4_0[7168 1024]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_down.weightQ4_0[20480 7168]
-
blk.1.ffn_gate.weightQ4_0[7168 20480]
-
blk.1.ffn_up.weightQ4_0[7168 20480]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.1.attn_k.weightQ4_0[7168 1024]
-
blk.1.attn_output.weightQ4_0[7168 7168]
-
blk.1.attn_q.weightQ4_0[7168 7168]
-
blk.1.attn_v.weightQ4_0[7168 1024]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_down.weightQ4_0[20480 7168]
-
blk.2.ffn_gate.weightQ4_0[7168 20480]
-
blk.2.ffn_up.weightQ4_0[7168 20480]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.2.attn_k.weightQ4_0[7168 1024]
-
blk.2.attn_output.weightQ4_0[7168 7168]
-
blk.2.attn_q.weightQ4_0[7168 7168]
-
blk.2.attn_v.weightQ4_0[7168 1024]
-
blk.3.ffn_gate.weightQ4_0[7168 20480]
-
blk.3.attn_k.weightQ4_0[7168 1024]
-
blk.3.attn_output.weightQ4_0[7168 7168]
-
blk.3.attn_q.weightQ4_0[7168 7168]
-
blk.3.attn_v.weightQ4_0[7168 1024]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_down.weightQ4_0[20480 7168]
-
blk.3.ffn_up.weightQ4_0[7168 20480]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_down.weightQ4_0[20480 7168]
-
blk.4.ffn_gate.weightQ4_0[7168 20480]
-
blk.4.ffn_up.weightQ4_0[7168 20480]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.4.attn_k.weightQ4_0[7168 1024]
-
blk.4.attn_output.weightQ4_0[7168 7168]
-
blk.4.attn_q.weightQ4_0[7168 7168]
-
blk.4.attn_v.weightQ4_0[7168 1024]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_down.weightQ4_0[20480 7168]
-
blk.5.ffn_gate.weightQ4_0[7168 20480]
-
blk.5.ffn_up.weightQ4_0[7168 20480]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.5.attn_k.weightQ4_0[7168 1024]
-
blk.5.attn_output.weightQ4_0[7168 7168]
-
blk.5.attn_q.weightQ4_0[7168 7168]
-
blk.5.attn_v.weightQ4_0[7168 1024]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_down.weightQ4_0[20480 7168]
-
blk.6.ffn_gate.weightQ4_0[7168 20480]
-
blk.6.ffn_up.weightQ4_0[7168 20480]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.6.attn_k.weightQ4_0[7168 1024]
-
blk.6.attn_output.weightQ4_0[7168 7168]
-
blk.6.attn_q.weightQ4_0[7168 7168]
-
blk.6.attn_v.weightQ4_0[7168 1024]
-
blk.7.ffn_gate.weightQ4_0[7168 20480]
-
blk.7.ffn_up.weightQ4_0[7168 20480]
-
blk.7.attn_k.weightQ4_0[7168 1024]
-
blk.7.attn_output.weightQ4_0[7168 7168]
-
blk.7.attn_q.weightQ4_0[7168 7168]
-
blk.7.attn_v.weightQ4_0[7168 1024]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_down.weightQ4_0[20480 7168]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_down.weightQ4_0[20480 7168]
-
blk.8.ffn_gate.weightQ4_0[7168 20480]
-
blk.8.ffn_up.weightQ4_0[7168 20480]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.8.attn_k.weightQ4_0[7168 1024]
-
blk.8.attn_output.weightQ4_0[7168 7168]
-
blk.8.attn_q.weightQ4_0[7168 7168]
-
blk.8.attn_v.weightQ4_0[7168 1024]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_down.weightQ4_0[20480 7168]
-
blk.9.ffn_gate.weightQ4_0[7168 20480]
-
blk.9.ffn_up.weightQ4_0[7168 20480]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.9.attn_k.weightQ4_0[7168 1024]
-
blk.9.attn_output.weightQ4_0[7168 7168]
-
blk.9.attn_q.weightQ4_0[7168 7168]
-
blk.9.attn_v.weightQ4_0[7168 1024]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_down.weightQ4_0[20480 7168]
-
blk.10.ffn_gate.weightQ4_0[7168 20480]
-
blk.10.ffn_up.weightQ4_0[7168 20480]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.10.attn_k.weightQ4_0[7168 1024]
-
blk.10.attn_output.weightQ4_0[7168 7168]
-
blk.10.attn_q.weightQ4_0[7168 7168]
-
blk.10.attn_v.weightQ4_0[7168 1024]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_down.weightQ4_0[20480 7168]
-
blk.11.ffn_gate.weightQ4_0[7168 20480]
-
blk.11.ffn_up.weightQ4_0[7168 20480]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.11.attn_k.weightQ4_0[7168 1024]
-
blk.11.attn_output.weightQ4_0[7168 7168]
-
blk.11.attn_q.weightQ4_0[7168 7168]
-
blk.11.attn_v.weightQ4_0[7168 1024]
-
blk.12.attn_k.weightQ4_0[7168 1024]
-
blk.12.attn_output.weightQ4_0[7168 7168]
-
blk.12.attn_q.weightQ4_0[7168 7168]
-
blk.12.attn_v.weightQ4_0[7168 1024]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_down.weightQ4_0[20480 7168]
-
blk.12.ffn_gate.weightQ4_0[7168 20480]
-
blk.12.ffn_up.weightQ4_0[7168 20480]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_down.weightQ4_0[20480 7168]
-
blk.13.ffn_gate.weightQ4_0[7168 20480]
-
blk.13.ffn_up.weightQ4_0[7168 20480]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.13.attn_k.weightQ4_0[7168 1024]
-
blk.13.attn_output.weightQ4_0[7168 7168]
-
blk.13.attn_q.weightQ4_0[7168 7168]
-
blk.13.attn_v.weightQ4_0[7168 1024]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_down.weightQ4_0[20480 7168]
-
blk.14.ffn_gate.weightQ4_0[7168 20480]
-
blk.14.ffn_up.weightQ4_0[7168 20480]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.14.attn_k.weightQ4_0[7168 1024]
-
blk.14.attn_output.weightQ4_0[7168 7168]
-
blk.14.attn_q.weightQ4_0[7168 7168]
-
blk.14.attn_v.weightQ4_0[7168 1024]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_down.weightQ4_0[20480 7168]
-
blk.15.ffn_gate.weightQ4_0[7168 20480]
-
blk.15.ffn_up.weightQ4_0[7168 20480]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.15.attn_k.weightQ4_0[7168 1024]
-
blk.15.attn_output.weightQ4_0[7168 7168]
-
blk.15.attn_q.weightQ4_0[7168 7168]
-
blk.15.attn_v.weightQ4_0[7168 1024]
-
blk.16.ffn_gate.weightQ4_0[7168 20480]
-
blk.16.attn_k.weightQ4_0[7168 1024]
-
blk.16.attn_output.weightQ4_0[7168 7168]
-
blk.16.attn_q.weightQ4_0[7168 7168]
-
blk.16.attn_v.weightQ4_0[7168 1024]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_down.weightQ4_0[20480 7168]
-
blk.16.ffn_up.weightQ4_0[7168 20480]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_down.weightQ4_0[20480 7168]
-
blk.17.ffn_gate.weightQ4_0[7168 20480]
-
blk.17.ffn_up.weightQ4_0[7168 20480]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.17.attn_k.weightQ4_0[7168 1024]
-
blk.17.attn_output.weightQ4_0[7168 7168]
-
blk.17.attn_q.weightQ4_0[7168 7168]
-
blk.17.attn_v.weightQ4_0[7168 1024]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_down.weightQ4_0[20480 7168]
-
blk.18.ffn_gate.weightQ4_0[7168 20480]
-
blk.18.ffn_up.weightQ4_0[7168 20480]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.18.attn_k.weightQ4_0[7168 1024]
-
blk.18.attn_output.weightQ4_0[7168 7168]
-
blk.18.attn_q.weightQ4_0[7168 7168]
-
blk.18.attn_v.weightQ4_0[7168 1024]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_down.weightQ4_0[20480 7168]
-
blk.19.ffn_gate.weightQ4_0[7168 20480]
-
blk.19.ffn_up.weightQ4_0[7168 20480]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.19.attn_k.weightQ4_0[7168 1024]
-
blk.19.attn_output.weightQ4_0[7168 7168]
-
blk.19.attn_q.weightQ4_0[7168 7168]
-
blk.19.attn_v.weightQ4_0[7168 1024]
-
blk.20.ffn_gate.weightQ4_0[7168 20480]
-
blk.20.ffn_up.weightQ4_0[7168 20480]
-
blk.20.attn_k.weightQ4_0[7168 1024]
-
blk.20.attn_output.weightQ4_0[7168 7168]
-
blk.20.attn_q.weightQ4_0[7168 7168]
-
blk.20.attn_v.weightQ4_0[7168 1024]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_down.weightQ4_0[20480 7168]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_down.weightQ4_0[20480 7168]
-
blk.21.ffn_gate.weightQ4_0[7168 20480]
-
blk.21.ffn_up.weightQ4_0[7168 20480]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.21.attn_k.weightQ4_0[7168 1024]
-
blk.21.attn_output.weightQ4_0[7168 7168]
-
blk.21.attn_q.weightQ4_0[7168 7168]
-
blk.21.attn_v.weightQ4_0[7168 1024]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_down.weightQ4_0[20480 7168]
-
blk.22.ffn_gate.weightQ4_0[7168 20480]
-
blk.22.ffn_up.weightQ4_0[7168 20480]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.22.attn_k.weightQ4_0[7168 1024]
-
blk.22.attn_output.weightQ4_0[7168 7168]
-
blk.22.attn_q.weightQ4_0[7168 7168]
-
blk.22.attn_v.weightQ4_0[7168 1024]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_down.weightQ4_0[20480 7168]
-
blk.23.ffn_gate.weightQ4_0[7168 20480]
-
blk.23.ffn_up.weightQ4_0[7168 20480]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.23.attn_k.weightQ4_0[7168 1024]
-
blk.23.attn_output.weightQ4_0[7168 7168]
-
blk.23.attn_q.weightQ4_0[7168 7168]
-
blk.23.attn_v.weightQ4_0[7168 1024]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_down.weightQ4_0[20480 7168]
-
blk.24.ffn_gate.weightQ4_0[7168 20480]
-
blk.24.ffn_up.weightQ4_0[7168 20480]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.24.attn_k.weightQ4_0[7168 1024]
-
blk.24.attn_output.weightQ4_0[7168 7168]
-
blk.24.attn_q.weightQ4_0[7168 7168]
-
blk.24.attn_v.weightQ4_0[7168 1024]
-
blk.25.attn_k.weightQ4_0[7168 1024]
-
blk.25.attn_output.weightQ4_0[7168 7168]
-
blk.25.attn_q.weightQ4_0[7168 7168]
-
blk.25.attn_v.weightQ4_0[7168 1024]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_down.weightQ4_0[20480 7168]
-
blk.25.ffn_gate.weightQ4_0[7168 20480]
-
blk.25.ffn_up.weightQ4_0[7168 20480]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_down.weightQ4_0[20480 7168]
-
blk.26.ffn_gate.weightQ4_0[7168 20480]
-
blk.26.ffn_up.weightQ4_0[7168 20480]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.26.attn_k.weightQ4_0[7168 1024]
-
blk.26.attn_output.weightQ4_0[7168 7168]
-
blk.26.attn_q.weightQ4_0[7168 7168]
-
blk.26.attn_v.weightQ4_0[7168 1024]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_down.weightQ4_0[20480 7168]
-
blk.27.ffn_gate.weightQ4_0[7168 20480]
-
blk.27.ffn_up.weightQ4_0[7168 20480]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.27.attn_k.weightQ4_0[7168 1024]
-
blk.27.attn_output.weightQ4_0[7168 7168]
-
blk.27.attn_q.weightQ4_0[7168 7168]
-
blk.27.attn_v.weightQ4_0[7168 1024]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_down.weightQ4_0[20480 7168]
-
blk.28.ffn_gate.weightQ4_0[7168 20480]
-
blk.28.ffn_up.weightQ4_0[7168 20480]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.28.attn_k.weightQ4_0[7168 1024]
-
blk.28.attn_output.weightQ4_0[7168 7168]
-
blk.28.attn_q.weightQ4_0[7168 7168]
-
blk.28.attn_v.weightQ4_0[7168 1024]
-
blk.29.ffn_gate.weightQ4_0[7168 20480]
-
blk.29.attn_k.weightQ4_0[7168 1024]
-
blk.29.attn_output.weightQ4_0[7168 7168]
-
blk.29.attn_q.weightQ4_0[7168 7168]
-
blk.29.attn_v.weightQ4_0[7168 1024]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_down.weightQ4_0[20480 7168]
-
blk.29.ffn_up.weightQ4_0[7168 20480]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_down.weightQ4_0[20480 7168]
-
blk.30.ffn_gate.weightQ4_0[7168 20480]
-
blk.30.ffn_up.weightQ4_0[7168 20480]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.30.attn_k.weightQ4_0[7168 1024]
-
blk.30.attn_output.weightQ4_0[7168 7168]
-
blk.30.attn_q.weightQ4_0[7168 7168]
-
blk.30.attn_v.weightQ4_0[7168 1024]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_down.weightQ4_0[20480 7168]
-
blk.31.ffn_gate.weightQ4_0[7168 20480]
-
blk.31.ffn_up.weightQ4_0[7168 20480]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.31.attn_k.weightQ4_0[7168 1024]
-
blk.31.attn_output.weightQ4_0[7168 7168]
-
blk.31.attn_q.weightQ4_0[7168 7168]
-
blk.31.attn_v.weightQ4_0[7168 1024]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_down.weightQ4_0[20480 7168]
-
blk.32.ffn_gate.weightQ4_0[7168 20480]
-
blk.32.ffn_up.weightQ4_0[7168 20480]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.32.attn_k.weightQ4_0[7168 1024]
-
blk.32.attn_output.weightQ4_0[7168 7168]
-
blk.32.attn_q.weightQ4_0[7168 7168]
-
blk.32.attn_v.weightQ4_0[7168 1024]
-
blk.33.ffn_gate.weightQ4_0[7168 20480]
-
blk.33.ffn_up.weightQ4_0[7168 20480]
-
blk.33.attn_k.weightQ4_0[7168 1024]
-
blk.33.attn_output.weightQ4_0[7168 7168]
-
blk.33.attn_q.weightQ4_0[7168 7168]
-
blk.33.attn_v.weightQ4_0[7168 1024]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_down.weightQ4_0[20480 7168]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_down.weightQ4_0[20480 7168]
-
blk.34.ffn_gate.weightQ4_0[7168 20480]
-
blk.34.ffn_up.weightQ4_0[7168 20480]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.34.attn_k.weightQ4_0[7168 1024]
-
blk.34.attn_output.weightQ4_0[7168 7168]
-
blk.34.attn_q.weightQ4_0[7168 7168]
-
blk.34.attn_v.weightQ4_0[7168 1024]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_down.weightQ4_0[20480 7168]
-
blk.35.ffn_gate.weightQ4_0[7168 20480]
-
blk.35.ffn_up.weightQ4_0[7168 20480]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.35.attn_k.weightQ4_0[7168 1024]
-
blk.35.attn_output.weightQ4_0[7168 7168]
-
blk.35.attn_q.weightQ4_0[7168 7168]
-
blk.35.attn_v.weightQ4_0[7168 1024]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_down.weightQ4_0[20480 7168]
-
blk.36.ffn_gate.weightQ4_0[7168 20480]
-
blk.36.ffn_up.weightQ4_0[7168 20480]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.36.attn_k.weightQ4_0[7168 1024]
-
blk.36.attn_output.weightQ4_0[7168 7168]
-
blk.36.attn_q.weightQ4_0[7168 7168]
-
blk.36.attn_v.weightQ4_0[7168 1024]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_down.weightQ4_0[20480 7168]
-
blk.37.ffn_gate.weightQ4_0[7168 20480]
-
blk.37.ffn_up.weightQ4_0[7168 20480]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.37.attn_k.weightQ4_0[7168 1024]
-
blk.37.attn_output.weightQ4_0[7168 7168]
-
blk.37.attn_q.weightQ4_0[7168 7168]
-
blk.37.attn_v.weightQ4_0[7168 1024]
-
blk.38.attn_k.weightQ4_0[7168 1024]
-
blk.38.attn_output.weightQ4_0[7168 7168]
-
blk.38.attn_q.weightQ4_0[7168 7168]
-
blk.38.attn_v.weightQ4_0[7168 1024]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_down.weightQ4_0[20480 7168]
-
blk.38.ffn_gate.weightQ4_0[7168 20480]
-
blk.38.ffn_up.weightQ4_0[7168 20480]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_down.weightQ4_0[20480 7168]
-
blk.39.ffn_gate.weightQ4_0[7168 20480]
-
blk.39.ffn_up.weightQ4_0[7168 20480]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.39.attn_k.weightQ4_0[7168 1024]
-
blk.39.attn_output.weightQ4_0[7168 7168]
-
blk.39.attn_q.weightQ4_0[7168 7168]
-
blk.39.attn_v.weightQ4_0[7168 1024]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_down.weightQ4_0[20480 7168]
-
blk.40.ffn_gate.weightQ4_0[7168 20480]
-
blk.40.ffn_up.weightQ4_0[7168 20480]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.40.attn_k.weightQ4_0[7168 1024]
-
blk.40.attn_output.weightQ4_0[7168 7168]
-
blk.40.attn_q.weightQ4_0[7168 7168]
-
blk.40.attn_v.weightQ4_0[7168 1024]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_down.weightQ4_0[20480 7168]
-
blk.41.ffn_gate.weightQ4_0[7168 20480]
-
blk.41.ffn_up.weightQ4_0[7168 20480]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.41.attn_k.weightQ4_0[7168 1024]
-
blk.41.attn_output.weightQ4_0[7168 7168]
-
blk.41.attn_q.weightQ4_0[7168 7168]
-
blk.41.attn_v.weightQ4_0[7168 1024]
-
blk.42.ffn_gate.weightQ4_0[7168 20480]
-
blk.42.attn_k.weightQ4_0[7168 1024]
-
blk.42.attn_output.weightQ4_0[7168 7168]
-
blk.42.attn_q.weightQ4_0[7168 7168]
-
blk.42.attn_v.weightQ4_0[7168 1024]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_down.weightQ4_0[20480 7168]
-
blk.42.ffn_up.weightQ4_0[7168 20480]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_down.weightQ4_0[20480 7168]
-
blk.43.ffn_gate.weightQ4_0[7168 20480]
-
blk.43.ffn_up.weightQ4_0[7168 20480]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.43.attn_k.weightQ4_0[7168 1024]
-
blk.43.attn_output.weightQ4_0[7168 7168]
-
blk.43.attn_q.weightQ4_0[7168 7168]
-
blk.43.attn_v.weightQ4_0[7168 1024]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_down.weightQ4_0[20480 7168]
-
blk.44.ffn_gate.weightQ4_0[7168 20480]
-
blk.44.ffn_up.weightQ4_0[7168 20480]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.44.attn_k.weightQ4_0[7168 1024]
-
blk.44.attn_output.weightQ4_0[7168 7168]
-
blk.44.attn_q.weightQ4_0[7168 7168]
-
blk.44.attn_v.weightQ4_0[7168 1024]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_down.weightQ4_0[20480 7168]
-
blk.45.ffn_gate.weightQ4_0[7168 20480]
-
blk.45.ffn_up.weightQ4_0[7168 20480]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.45.attn_k.weightQ4_0[7168 1024]
-
blk.45.attn_output.weightQ4_0[7168 7168]
-
blk.45.attn_q.weightQ4_0[7168 7168]
-
blk.45.attn_v.weightQ4_0[7168 1024]
-
blk.46.ffn_gate.weightQ4_0[7168 20480]
-
blk.46.ffn_up.weightQ4_0[7168 20480]
-
blk.46.attn_k.weightQ4_0[7168 1024]
-
blk.46.attn_output.weightQ4_0[7168 7168]
-
blk.46.attn_q.weightQ4_0[7168 7168]
-
blk.46.attn_v.weightQ4_0[7168 1024]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_down.weightQ4_0[20480 7168]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_down.weightQ4_0[20480 7168]
-
blk.47.ffn_gate.weightQ4_0[7168 20480]
-
blk.47.ffn_up.weightQ4_0[7168 20480]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.47.attn_k.weightQ4_0[7168 1024]
-
blk.47.attn_output.weightQ4_0[7168 7168]
-
blk.47.attn_q.weightQ4_0[7168 7168]
-
blk.47.attn_v.weightQ4_0[7168 1024]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_down.weightQ4_0[20480 7168]
-
blk.48.ffn_gate.weightQ4_0[7168 20480]
-
blk.48.ffn_up.weightQ4_0[7168 20480]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.48.attn_k.weightQ4_0[7168 1024]
-
blk.48.attn_output.weightQ4_0[7168 7168]
-
blk.48.attn_q.weightQ4_0[7168 7168]
-
blk.48.attn_v.weightQ4_0[7168 1024]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_down.weightQ4_0[20480 7168]
-
blk.49.ffn_gate.weightQ4_0[7168 20480]
-
blk.49.ffn_up.weightQ4_0[7168 20480]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.49.attn_k.weightQ4_0[7168 1024]
-
blk.49.attn_output.weightQ4_0[7168 7168]
-
blk.49.attn_q.weightQ4_0[7168 7168]
-
blk.49.attn_v.weightQ4_0[7168 1024]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_down.weightQ4_0[20480 7168]
-
blk.50.ffn_gate.weightQ4_0[7168 20480]
-
blk.50.ffn_up.weightQ4_0[7168 20480]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.50.attn_k.weightQ4_0[7168 1024]
-
blk.50.attn_output.weightQ4_0[7168 7168]
-
blk.50.attn_q.weightQ4_0[7168 7168]
-
blk.50.attn_v.weightQ4_0[7168 1024]
-
blk.51.attn_k.weightQ4_0[7168 1024]
-
blk.51.attn_output.weightQ4_0[7168 7168]
-
blk.51.attn_q.weightQ4_0[7168 7168]
-
blk.51.attn_v.weightQ4_0[7168 1024]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_down.weightQ4_0[20480 7168]
-
blk.51.ffn_gate.weightQ4_0[7168 20480]
-
blk.51.ffn_up.weightQ4_0[7168 20480]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_down.weightQ4_0[20480 7168]
-
blk.52.ffn_gate.weightQ4_0[7168 20480]
-
blk.52.ffn_up.weightQ4_0[7168 20480]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.52.attn_k.weightQ4_0[7168 1024]
-
blk.52.attn_output.weightQ4_0[7168 7168]
-
blk.52.attn_q.weightQ4_0[7168 7168]
-
blk.52.attn_v.weightQ4_0[7168 1024]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_down.weightQ4_0[20480 7168]
-
blk.53.ffn_gate.weightQ4_0[7168 20480]
-
blk.53.ffn_up.weightQ4_0[7168 20480]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.53.attn_k.weightQ4_0[7168 1024]
-
blk.53.attn_output.weightQ4_0[7168 7168]
-
blk.53.attn_q.weightQ4_0[7168 7168]
-
blk.53.attn_v.weightQ4_0[7168 1024]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_down.weightQ4_0[20480 7168]
-
blk.54.ffn_gate.weightQ4_0[7168 20480]
-
blk.54.ffn_up.weightQ4_0[7168 20480]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.54.attn_k.weightQ4_0[7168 1024]
-
blk.54.attn_output.weightQ4_0[7168 7168]
-
blk.54.attn_q.weightQ4_0[7168 7168]
-
blk.54.attn_v.weightQ4_0[7168 1024]
-
blk.55.ffn_gate.weightQ4_0[7168 20480]
-
blk.55.attn_k.weightQ4_0[7168 1024]
-
blk.55.attn_output.weightQ4_0[7168 7168]
-
blk.55.attn_q.weightQ4_0[7168 7168]
-
blk.55.attn_v.weightQ4_0[7168 1024]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_down.weightQ4_0[20480 7168]
-
blk.55.ffn_up.weightQ4_0[7168 20480]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_down.weightQ4_0[20480 7168]
-
blk.56.ffn_gate.weightQ4_0[7168 20480]
-
blk.56.ffn_up.weightQ4_0[7168 20480]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.56.attn_k.weightQ4_0[7168 1024]
-
blk.56.attn_output.weightQ4_0[7168 7168]
-
blk.56.attn_q.weightQ4_0[7168 7168]
-
blk.56.attn_v.weightQ4_0[7168 1024]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_down.weightQ4_0[20480 7168]
-
blk.57.ffn_gate.weightQ4_0[7168 20480]
-
blk.57.ffn_up.weightQ4_0[7168 20480]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.57.attn_k.weightQ4_0[7168 1024]
-
blk.57.attn_output.weightQ4_0[7168 7168]
-
blk.57.attn_q.weightQ4_0[7168 7168]
-
blk.57.attn_v.weightQ4_0[7168 1024]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_down.weightQ4_0[20480 7168]
-
blk.58.ffn_gate.weightQ4_0[7168 20480]
-
blk.58.ffn_up.weightQ4_0[7168 20480]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.58.attn_k.weightQ4_0[7168 1024]
-
blk.58.attn_output.weightQ4_0[7168 7168]
-
blk.58.attn_q.weightQ4_0[7168 7168]
-
blk.58.attn_v.weightQ4_0[7168 1024]
-
blk.59.ffn_gate.weightQ4_0[7168 20480]
-
blk.59.ffn_up.weightQ4_0[7168 20480]
-
blk.59.attn_k.weightQ4_0[7168 1024]
-
blk.59.attn_output.weightQ4_0[7168 7168]
-
blk.59.attn_q.weightQ4_0[7168 7168]
-
blk.59.attn_v.weightQ4_0[7168 1024]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_down.weightQ4_0[20480 7168]
-
blk.59.ffn_norm.weightF32[7168]
-
output.weightQ6_K[7168 64000]
-
output_norm.weightF32[7168]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59