latest
13GB
Tools
22B
Updated yesterday
7f39b4b7da05 · 13GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count48
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count56
-
llama.context_length131072
-
llama.embedding_length6144
-
llama.feed_forward_length16384
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32768
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[6144 32768]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_down.weightQ6_K[16384 6144]
-
blk.0.ffn_gate.weightQ4_K[6144 16384]
-
blk.0.ffn_up.weightQ4_K[6144 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.attn_k.weightQ4_K[6144 1024]
-
blk.0.attn_output.weightQ4_K[6144 6144]
-
blk.0.attn_q.weightQ4_K[6144 6144]
-
blk.0.attn_v.weightQ6_K[6144 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_down.weightQ6_K[16384 6144]
-
blk.1.ffn_gate.weightQ4_K[6144 16384]
-
blk.1.ffn_up.weightQ4_K[6144 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.attn_k.weightQ4_K[6144 1024]
-
blk.1.attn_output.weightQ4_K[6144 6144]
-
blk.1.attn_q.weightQ4_K[6144 6144]
-
blk.1.attn_v.weightQ6_K[6144 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_down.weightQ6_K[16384 6144]
-
blk.2.ffn_gate.weightQ4_K[6144 16384]
-
blk.2.ffn_up.weightQ4_K[6144 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.attn_k.weightQ4_K[6144 1024]
-
blk.2.attn_output.weightQ4_K[6144 6144]
-
blk.2.attn_q.weightQ4_K[6144 6144]
-
blk.2.attn_v.weightQ6_K[6144 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_down.weightQ6_K[16384 6144]
-
blk.3.ffn_gate.weightQ4_K[6144 16384]
-
blk.3.ffn_up.weightQ4_K[6144 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.attn_k.weightQ4_K[6144 1024]
-
blk.3.attn_output.weightQ4_K[6144 6144]
-
blk.3.attn_q.weightQ4_K[6144 6144]
-
blk.3.attn_v.weightQ6_K[6144 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_down.weightQ6_K[16384 6144]
-
blk.4.ffn_gate.weightQ4_K[6144 16384]
-
blk.4.ffn_up.weightQ4_K[6144 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.attn_k.weightQ4_K[6144 1024]
-
blk.4.attn_output.weightQ4_K[6144 6144]
-
blk.4.attn_q.weightQ4_K[6144 6144]
-
blk.4.attn_v.weightQ6_K[6144 1024]
-
blk.5.ffn_gate.weightQ4_K[6144 16384]
-
blk.5.ffn_up.weightQ4_K[6144 16384]
-
blk.5.attn_k.weightQ4_K[6144 1024]
-
blk.5.attn_output.weightQ4_K[6144 6144]
-
blk.5.attn_q.weightQ4_K[6144 6144]
-
blk.5.attn_v.weightQ6_K[6144 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_down.weightQ4_K[16384 6144]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_down.weightQ4_K[16384 6144]
-
blk.6.ffn_gate.weightQ4_K[6144 16384]
-
blk.6.ffn_up.weightQ4_K[6144 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.attn_k.weightQ4_K[6144 1024]
-
blk.6.attn_output.weightQ4_K[6144 6144]
-
blk.6.attn_q.weightQ4_K[6144 6144]
-
blk.6.attn_v.weightQ6_K[6144 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_down.weightQ6_K[16384 6144]
-
blk.7.ffn_gate.weightQ4_K[6144 16384]
-
blk.7.ffn_up.weightQ4_K[6144 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.attn_k.weightQ4_K[6144 1024]
-
blk.7.attn_output.weightQ4_K[6144 6144]
-
blk.7.attn_q.weightQ4_K[6144 6144]
-
blk.7.attn_v.weightQ4_K[6144 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_down.weightQ4_K[16384 6144]
-
blk.8.ffn_gate.weightQ4_K[6144 16384]
-
blk.8.ffn_up.weightQ4_K[6144 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.attn_k.weightQ4_K[6144 1024]
-
blk.8.attn_output.weightQ4_K[6144 6144]
-
blk.8.attn_q.weightQ4_K[6144 6144]
-
blk.8.attn_v.weightQ4_K[6144 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_down.weightQ4_K[16384 6144]
-
blk.9.ffn_gate.weightQ4_K[6144 16384]
-
blk.9.ffn_up.weightQ4_K[6144 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.attn_k.weightQ4_K[6144 1024]
-
blk.9.attn_output.weightQ4_K[6144 6144]
-
blk.9.attn_q.weightQ4_K[6144 6144]
-
blk.9.attn_v.weightQ6_K[6144 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_down.weightQ6_K[16384 6144]
-
blk.10.ffn_gate.weightQ4_K[6144 16384]
-
blk.10.ffn_up.weightQ4_K[6144 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.attn_k.weightQ4_K[6144 1024]
-
blk.10.attn_output.weightQ4_K[6144 6144]
-
blk.10.attn_q.weightQ4_K[6144 6144]
-
blk.10.attn_v.weightQ6_K[6144 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_down.weightQ6_K[16384 6144]
-
blk.11.ffn_gate.weightQ4_K[6144 16384]
-
blk.11.ffn_up.weightQ4_K[6144 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.attn_k.weightQ4_K[6144 1024]
-
blk.11.attn_output.weightQ4_K[6144 6144]
-
blk.11.attn_q.weightQ4_K[6144 6144]
-
blk.11.attn_v.weightQ4_K[6144 1024]
-
blk.12.attn_k.weightQ4_K[6144 1024]
-
blk.12.attn_q.weightQ4_K[6144 6144]
-
blk.12.attn_v.weightQ4_K[6144 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_down.weightQ6_K[16384 6144]
-
blk.12.ffn_gate.weightQ4_K[6144 16384]
-
blk.12.ffn_up.weightQ4_K[6144 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.attn_output.weightQ4_K[6144 6144]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_down.weightQ4_K[16384 6144]
-
blk.13.ffn_gate.weightQ4_K[6144 16384]
-
blk.13.ffn_up.weightQ4_K[6144 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.attn_k.weightQ4_K[6144 1024]
-
blk.13.attn_output.weightQ4_K[6144 6144]
-
blk.13.attn_q.weightQ4_K[6144 6144]
-
blk.13.attn_v.weightQ4_K[6144 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_down.weightQ4_K[16384 6144]
-
blk.14.ffn_gate.weightQ4_K[6144 16384]
-
blk.14.ffn_up.weightQ4_K[6144 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.attn_k.weightQ4_K[6144 1024]
-
blk.14.attn_output.weightQ4_K[6144 6144]
-
blk.14.attn_q.weightQ4_K[6144 6144]
-
blk.14.attn_v.weightQ4_K[6144 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_down.weightQ6_K[16384 6144]
-
blk.15.ffn_gate.weightQ4_K[6144 16384]
-
blk.15.ffn_up.weightQ4_K[6144 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.attn_k.weightQ4_K[6144 1024]
-
blk.15.attn_output.weightQ4_K[6144 6144]
-
blk.15.attn_q.weightQ4_K[6144 6144]
-
blk.15.attn_v.weightQ6_K[6144 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_down.weightQ4_K[16384 6144]
-
blk.16.ffn_gate.weightQ4_K[6144 16384]
-
blk.16.ffn_up.weightQ4_K[6144 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.attn_k.weightQ4_K[6144 1024]
-
blk.16.attn_output.weightQ4_K[6144 6144]
-
blk.16.attn_q.weightQ4_K[6144 6144]
-
blk.16.attn_v.weightQ4_K[6144 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_down.weightQ4_K[16384 6144]
-
blk.17.ffn_gate.weightQ4_K[6144 16384]
-
blk.17.ffn_up.weightQ4_K[6144 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.attn_k.weightQ4_K[6144 1024]
-
blk.17.attn_output.weightQ4_K[6144 6144]
-
blk.17.attn_q.weightQ4_K[6144 6144]
-
blk.17.attn_v.weightQ4_K[6144 1024]
-
blk.18.ffn_gate.weightQ4_K[6144 16384]
-
blk.18.attn_k.weightQ4_K[6144 1024]
-
blk.18.attn_output.weightQ4_K[6144 6144]
-
blk.18.attn_q.weightQ4_K[6144 6144]
-
blk.18.attn_v.weightQ6_K[6144 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_down.weightQ6_K[16384 6144]
-
blk.18.ffn_up.weightQ4_K[6144 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_down.weightQ4_K[16384 6144]
-
blk.19.ffn_gate.weightQ4_K[6144 16384]
-
blk.19.ffn_up.weightQ4_K[6144 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.attn_k.weightQ4_K[6144 1024]
-
blk.19.attn_output.weightQ4_K[6144 6144]
-
blk.19.attn_q.weightQ4_K[6144 6144]
-
blk.19.attn_v.weightQ4_K[6144 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_down.weightQ4_K[16384 6144]
-
blk.20.ffn_gate.weightQ4_K[6144 16384]
-
blk.20.ffn_up.weightQ4_K[6144 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.attn_k.weightQ4_K[6144 1024]
-
blk.20.attn_output.weightQ4_K[6144 6144]
-
blk.20.attn_q.weightQ4_K[6144 6144]
-
blk.20.attn_v.weightQ4_K[6144 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_down.weightQ6_K[16384 6144]
-
blk.21.ffn_gate.weightQ4_K[6144 16384]
-
blk.21.ffn_up.weightQ4_K[6144 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.attn_k.weightQ4_K[6144 1024]
-
blk.21.attn_output.weightQ4_K[6144 6144]
-
blk.21.attn_q.weightQ4_K[6144 6144]
-
blk.21.attn_v.weightQ6_K[6144 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_down.weightQ4_K[16384 6144]
-
blk.22.ffn_gate.weightQ4_K[6144 16384]
-
blk.22.ffn_up.weightQ4_K[6144 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.attn_k.weightQ4_K[6144 1024]
-
blk.22.attn_output.weightQ4_K[6144 6144]
-
blk.22.attn_q.weightQ4_K[6144 6144]
-
blk.22.attn_v.weightQ4_K[6144 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_down.weightQ4_K[16384 6144]
-
blk.23.ffn_gate.weightQ4_K[6144 16384]
-
blk.23.ffn_up.weightQ4_K[6144 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.attn_k.weightQ4_K[6144 1024]
-
blk.23.attn_output.weightQ4_K[6144 6144]
-
blk.23.attn_q.weightQ4_K[6144 6144]
-
blk.23.attn_v.weightQ4_K[6144 1024]
-
blk.24.ffn_gate.weightQ4_K[6144 16384]
-
blk.24.ffn_up.weightQ4_K[6144 16384]
-
blk.24.attn_k.weightQ4_K[6144 1024]
-
blk.24.attn_output.weightQ4_K[6144 6144]
-
blk.24.attn_q.weightQ4_K[6144 6144]
-
blk.24.attn_v.weightQ6_K[6144 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_down.weightQ6_K[16384 6144]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_down.weightQ4_K[16384 6144]
-
blk.25.ffn_gate.weightQ4_K[6144 16384]
-
blk.25.ffn_up.weightQ4_K[6144 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.attn_k.weightQ4_K[6144 1024]
-
blk.25.attn_output.weightQ4_K[6144 6144]
-
blk.25.attn_q.weightQ4_K[6144 6144]
-
blk.25.attn_v.weightQ4_K[6144 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_down.weightQ4_K[16384 6144]
-
blk.26.ffn_gate.weightQ4_K[6144 16384]
-
blk.26.ffn_up.weightQ4_K[6144 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.attn_k.weightQ4_K[6144 1024]
-
blk.26.attn_output.weightQ4_K[6144 6144]
-
blk.26.attn_q.weightQ4_K[6144 6144]
-
blk.26.attn_v.weightQ4_K[6144 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_down.weightQ6_K[16384 6144]
-
blk.27.ffn_gate.weightQ4_K[6144 16384]
-
blk.27.ffn_up.weightQ4_K[6144 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.attn_k.weightQ4_K[6144 1024]
-
blk.27.attn_output.weightQ4_K[6144 6144]
-
blk.27.attn_q.weightQ4_K[6144 6144]
-
blk.27.attn_v.weightQ6_K[6144 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_down.weightQ4_K[16384 6144]
-
blk.28.ffn_gate.weightQ4_K[6144 16384]
-
blk.28.ffn_up.weightQ4_K[6144 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.attn_k.weightQ4_K[6144 1024]
-
blk.28.attn_output.weightQ4_K[6144 6144]
-
blk.28.attn_q.weightQ4_K[6144 6144]
-
blk.28.attn_v.weightQ4_K[6144 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_down.weightQ4_K[16384 6144]
-
blk.29.ffn_gate.weightQ4_K[6144 16384]
-
blk.29.ffn_up.weightQ4_K[6144 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.attn_k.weightQ4_K[6144 1024]
-
blk.29.attn_output.weightQ4_K[6144 6144]
-
blk.29.attn_q.weightQ4_K[6144 6144]
-
blk.29.attn_v.weightQ4_K[6144 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_down.weightQ6_K[16384 6144]
-
blk.30.ffn_gate.weightQ4_K[6144 16384]
-
blk.30.ffn_up.weightQ4_K[6144 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.attn_k.weightQ4_K[6144 1024]
-
blk.30.attn_output.weightQ4_K[6144 6144]
-
blk.30.attn_q.weightQ4_K[6144 6144]
-
blk.30.attn_v.weightQ6_K[6144 1024]
-
blk.31.attn_k.weightQ4_K[6144 1024]
-
blk.31.attn_q.weightQ4_K[6144 6144]
-
blk.31.attn_v.weightQ4_K[6144 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_down.weightQ4_K[16384 6144]
-
blk.31.ffn_gate.weightQ4_K[6144 16384]
-
blk.31.ffn_up.weightQ4_K[6144 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.attn_output.weightQ4_K[6144 6144]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_down.weightQ4_K[16384 6144]
-
blk.32.ffn_gate.weightQ4_K[6144 16384]
-
blk.32.ffn_up.weightQ4_K[6144 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.attn_k.weightQ4_K[6144 1024]
-
blk.32.attn_output.weightQ4_K[6144 6144]
-
blk.32.attn_q.weightQ4_K[6144 6144]
-
blk.32.attn_v.weightQ4_K[6144 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_down.weightQ6_K[16384 6144]
-
blk.33.ffn_gate.weightQ4_K[6144 16384]
-
blk.33.ffn_up.weightQ4_K[6144 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.attn_k.weightQ4_K[6144 1024]
-
blk.33.attn_output.weightQ4_K[6144 6144]
-
blk.33.attn_q.weightQ4_K[6144 6144]
-
blk.33.attn_v.weightQ6_K[6144 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_down.weightQ4_K[16384 6144]
-
blk.34.ffn_gate.weightQ4_K[6144 16384]
-
blk.34.ffn_up.weightQ4_K[6144 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.attn_k.weightQ4_K[6144 1024]
-
blk.34.attn_output.weightQ4_K[6144 6144]
-
blk.34.attn_q.weightQ4_K[6144 6144]
-
blk.34.attn_v.weightQ4_K[6144 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_down.weightQ4_K[16384 6144]
-
blk.35.ffn_gate.weightQ4_K[6144 16384]
-
blk.35.ffn_up.weightQ4_K[6144 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.attn_k.weightQ4_K[6144 1024]
-
blk.35.attn_output.weightQ4_K[6144 6144]
-
blk.35.attn_q.weightQ4_K[6144 6144]
-
blk.35.attn_v.weightQ4_K[6144 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_down.weightQ6_K[16384 6144]
-
blk.36.ffn_gate.weightQ4_K[6144 16384]
-
blk.36.ffn_up.weightQ4_K[6144 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.attn_k.weightQ4_K[6144 1024]
-
blk.36.attn_output.weightQ4_K[6144 6144]
-
blk.36.attn_q.weightQ4_K[6144 6144]
-
blk.36.attn_v.weightQ6_K[6144 1024]
-
blk.37.ffn_gate.weightQ4_K[6144 16384]
-
blk.37.attn_k.weightQ4_K[6144 1024]
-
blk.37.attn_output.weightQ4_K[6144 6144]
-
blk.37.attn_q.weightQ4_K[6144 6144]
-
blk.37.attn_v.weightQ4_K[6144 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_down.weightQ4_K[16384 6144]
-
blk.37.ffn_up.weightQ4_K[6144 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_down.weightQ4_K[16384 6144]
-
blk.38.ffn_gate.weightQ4_K[6144 16384]
-
blk.38.ffn_up.weightQ4_K[6144 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.attn_k.weightQ4_K[6144 1024]
-
blk.38.attn_output.weightQ4_K[6144 6144]
-
blk.38.attn_q.weightQ4_K[6144 6144]
-
blk.38.attn_v.weightQ4_K[6144 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_down.weightQ6_K[16384 6144]
-
blk.39.ffn_gate.weightQ4_K[6144 16384]
-
blk.39.ffn_up.weightQ4_K[6144 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.attn_k.weightQ4_K[6144 1024]
-
blk.39.attn_output.weightQ4_K[6144 6144]
-
blk.39.attn_q.weightQ4_K[6144 6144]
-
blk.39.attn_v.weightQ6_K[6144 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_down.weightQ4_K[16384 6144]
-
blk.40.ffn_gate.weightQ4_K[6144 16384]
-
blk.40.ffn_up.weightQ4_K[6144 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.attn_k.weightQ4_K[6144 1024]
-
blk.40.attn_output.weightQ4_K[6144 6144]
-
blk.40.attn_q.weightQ4_K[6144 6144]
-
blk.40.attn_v.weightQ4_K[6144 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_down.weightQ4_K[16384 6144]
-
blk.41.ffn_gate.weightQ4_K[6144 16384]
-
blk.41.ffn_up.weightQ4_K[6144 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.attn_k.weightQ4_K[6144 1024]
-
blk.41.attn_output.weightQ4_K[6144 6144]
-
blk.41.attn_q.weightQ4_K[6144 6144]
-
blk.41.attn_v.weightQ4_K[6144 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_down.weightQ6_K[16384 6144]
-
blk.42.ffn_gate.weightQ4_K[6144 16384]
-
blk.42.ffn_up.weightQ4_K[6144 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.attn_k.weightQ4_K[6144 1024]
-
blk.42.attn_output.weightQ4_K[6144 6144]
-
blk.42.attn_q.weightQ4_K[6144 6144]
-
blk.42.attn_v.weightQ6_K[6144 1024]
-
blk.43.ffn_gate.weightQ4_K[6144 16384]
-
blk.43.ffn_up.weightQ4_K[6144 16384]
-
blk.43.attn_k.weightQ4_K[6144 1024]
-
blk.43.attn_output.weightQ4_K[6144 6144]
-
blk.43.attn_q.weightQ4_K[6144 6144]
-
blk.43.attn_v.weightQ4_K[6144 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_down.weightQ4_K[16384 6144]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_down.weightQ4_K[16384 6144]
-
blk.44.ffn_gate.weightQ4_K[6144 16384]
-
blk.44.ffn_up.weightQ4_K[6144 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.attn_k.weightQ4_K[6144 1024]
-
blk.44.attn_output.weightQ4_K[6144 6144]
-
blk.44.attn_q.weightQ4_K[6144 6144]
-
blk.44.attn_v.weightQ4_K[6144 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_down.weightQ6_K[16384 6144]
-
blk.45.ffn_gate.weightQ4_K[6144 16384]
-
blk.45.ffn_up.weightQ4_K[6144 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.attn_k.weightQ4_K[6144 1024]
-
blk.45.attn_output.weightQ4_K[6144 6144]
-
blk.45.attn_q.weightQ4_K[6144 6144]
-
blk.45.attn_v.weightQ6_K[6144 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_down.weightQ4_K[16384 6144]
-
blk.46.ffn_gate.weightQ4_K[6144 16384]
-
blk.46.ffn_up.weightQ4_K[6144 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.attn_k.weightQ4_K[6144 1024]
-
blk.46.attn_output.weightQ4_K[6144 6144]
-
blk.46.attn_q.weightQ4_K[6144 6144]
-
blk.46.attn_v.weightQ4_K[6144 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_down.weightQ4_K[16384 6144]
-
blk.47.ffn_gate.weightQ4_K[6144 16384]
-
blk.47.ffn_up.weightQ4_K[6144 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.attn_k.weightQ4_K[6144 1024]
-
blk.47.attn_output.weightQ4_K[6144 6144]
-
blk.47.attn_q.weightQ4_K[6144 6144]
-
blk.47.attn_v.weightQ4_K[6144 1024]
-
blk.48.attn_norm.weightF32[6144]
-
blk.48.ffn_down.weightQ6_K[16384 6144]
-
blk.48.ffn_gate.weightQ4_K[6144 16384]
-
blk.48.ffn_up.weightQ4_K[6144 16384]
-
blk.48.ffn_norm.weightF32[6144]
-
blk.48.attn_k.weightQ4_K[6144 1024]
-
blk.48.attn_output.weightQ4_K[6144 6144]
-
blk.48.attn_q.weightQ4_K[6144 6144]
-
blk.48.attn_v.weightQ6_K[6144 1024]
-
blk.49.attn_norm.weightF32[6144]
-
blk.49.ffn_down.weightQ6_K[16384 6144]
-
blk.49.ffn_gate.weightQ4_K[6144 16384]
-
blk.49.ffn_up.weightQ4_K[6144 16384]
-
blk.49.ffn_norm.weightF32[6144]
-
blk.49.attn_k.weightQ4_K[6144 1024]
-
blk.49.attn_output.weightQ4_K[6144 6144]
-
blk.49.attn_q.weightQ4_K[6144 6144]
-
blk.49.attn_v.weightQ6_K[6144 1024]
-
blk.50.attn_k.weightQ4_K[6144 1024]
-
blk.50.attn_q.weightQ4_K[6144 6144]
-
blk.50.attn_v.weightQ6_K[6144 1024]
-
blk.50.attn_norm.weightF32[6144]
-
blk.50.ffn_down.weightQ6_K[16384 6144]
-
blk.50.ffn_gate.weightQ4_K[6144 16384]
-
blk.50.ffn_up.weightQ4_K[6144 16384]
-
blk.50.ffn_norm.weightF32[6144]
-
blk.50.attn_output.weightQ4_K[6144 6144]
-
blk.51.attn_norm.weightF32[6144]
-
blk.51.ffn_down.weightQ6_K[16384 6144]
-
blk.51.ffn_gate.weightQ4_K[6144 16384]
-
blk.51.ffn_up.weightQ4_K[6144 16384]
-
blk.51.ffn_norm.weightF32[6144]
-
blk.51.attn_k.weightQ4_K[6144 1024]
-
blk.51.attn_output.weightQ4_K[6144 6144]
-
blk.51.attn_q.weightQ4_K[6144 6144]
-
blk.51.attn_v.weightQ6_K[6144 1024]
-
blk.52.attn_norm.weightF32[6144]
-
blk.52.ffn_down.weightQ6_K[16384 6144]
-
blk.52.ffn_gate.weightQ4_K[6144 16384]
-
blk.52.ffn_up.weightQ4_K[6144 16384]
-
blk.52.ffn_norm.weightF32[6144]
-
blk.52.attn_k.weightQ4_K[6144 1024]
-
blk.52.attn_output.weightQ4_K[6144 6144]
-
blk.52.attn_q.weightQ4_K[6144 6144]
-
blk.52.attn_v.weightQ6_K[6144 1024]
-
blk.53.attn_norm.weightF32[6144]
-
blk.53.ffn_down.weightQ6_K[16384 6144]
-
blk.53.ffn_gate.weightQ4_K[6144 16384]
-
blk.53.ffn_up.weightQ4_K[6144 16384]
-
blk.53.ffn_norm.weightF32[6144]
-
blk.53.attn_k.weightQ4_K[6144 1024]
-
blk.53.attn_output.weightQ4_K[6144 6144]
-
blk.53.attn_q.weightQ4_K[6144 6144]
-
blk.53.attn_v.weightQ6_K[6144 1024]
-
blk.54.attn_norm.weightF32[6144]
-
blk.54.ffn_down.weightQ6_K[16384 6144]
-
blk.54.ffn_gate.weightQ4_K[6144 16384]
-
blk.54.ffn_up.weightQ4_K[6144 16384]
-
blk.54.ffn_norm.weightF32[6144]
-
blk.54.attn_k.weightQ4_K[6144 1024]
-
blk.54.attn_output.weightQ4_K[6144 6144]
-
blk.54.attn_q.weightQ4_K[6144 6144]
-
blk.54.attn_v.weightQ6_K[6144 1024]
-
blk.55.attn_norm.weightF32[6144]
-
blk.55.ffn_down.weightQ6_K[16384 6144]
-
blk.55.ffn_gate.weightQ4_K[6144 16384]
-
blk.55.ffn_up.weightQ4_K[6144 16384]
-
blk.55.ffn_norm.weightF32[6144]
-
blk.55.attn_k.weightQ4_K[6144 1024]
-
blk.55.attn_output.weightQ4_K[6144 6144]
-
blk.55.attn_q.weightQ4_K[6144 6144]
-
blk.55.attn_v.weightQ6_K[6144 1024]
-
output.weightQ6_K[6144 32768]
-
output_norm.weightF32[6144]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55