latest
19GB
deepseek-coder-33b-instruct is a 33B parameter model initialized from deepseek-coder-33b-base and fine-tuned on 2B tokens of instruction data.
Tools
33B
20 Pulls Updated 12 days ago
8e468bca4a5e · 19GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count62
-
llama.context_length16384
-
llama.embedding_length7168
-
llama.feed_forward_length19200
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
llama.vocab_size32256
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32021
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.predeepseek-coder
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_0[7168 32256]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_down.weightQ4_0[19200 7168]
-
blk.0.ffn_gate.weightQ4_0[7168 19200]
-
blk.0.ffn_up.weightQ4_0[7168 19200]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.0.attn_k.weightQ4_0[7168 1024]
-
blk.0.attn_output.weightQ4_0[7168 7168]
-
blk.0.attn_q.weightQ4_0[7168 7168]
-
blk.0.attn_v.weightQ4_0[7168 1024]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_down.weightQ4_0[19200 7168]
-
blk.1.ffn_gate.weightQ4_0[7168 19200]
-
blk.1.ffn_up.weightQ4_0[7168 19200]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.1.attn_k.weightQ4_0[7168 1024]
-
blk.1.attn_output.weightQ4_0[7168 7168]
-
blk.1.attn_q.weightQ4_0[7168 7168]
-
blk.1.attn_v.weightQ4_0[7168 1024]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_down.weightQ4_0[19200 7168]
-
blk.2.ffn_gate.weightQ4_0[7168 19200]
-
blk.2.ffn_up.weightQ4_0[7168 19200]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.2.attn_k.weightQ4_0[7168 1024]
-
blk.2.attn_output.weightQ4_0[7168 7168]
-
blk.2.attn_q.weightQ4_0[7168 7168]
-
blk.2.attn_v.weightQ4_0[7168 1024]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_down.weightQ4_0[19200 7168]
-
blk.3.ffn_gate.weightQ4_0[7168 19200]
-
blk.3.ffn_up.weightQ4_0[7168 19200]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.3.attn_k.weightQ4_0[7168 1024]
-
blk.3.attn_output.weightQ4_0[7168 7168]
-
blk.3.attn_q.weightQ4_0[7168 7168]
-
blk.3.attn_v.weightQ4_0[7168 1024]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_down.weightQ4_0[19200 7168]
-
blk.4.ffn_gate.weightQ4_0[7168 19200]
-
blk.4.ffn_up.weightQ4_0[7168 19200]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.4.attn_k.weightQ4_0[7168 1024]
-
blk.4.attn_output.weightQ4_0[7168 7168]
-
blk.4.attn_q.weightQ4_0[7168 7168]
-
blk.4.attn_v.weightQ4_0[7168 1024]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_down.weightQ4_0[19200 7168]
-
blk.5.ffn_gate.weightQ4_0[7168 19200]
-
blk.5.ffn_up.weightQ4_0[7168 19200]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.5.attn_k.weightQ4_0[7168 1024]
-
blk.5.attn_output.weightQ4_0[7168 7168]
-
blk.5.attn_q.weightQ4_0[7168 7168]
-
blk.5.attn_v.weightQ4_0[7168 1024]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_down.weightQ4_0[19200 7168]
-
blk.6.ffn_gate.weightQ4_0[7168 19200]
-
blk.6.ffn_up.weightQ4_0[7168 19200]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.6.attn_k.weightQ4_0[7168 1024]
-
blk.6.attn_output.weightQ4_0[7168 7168]
-
blk.6.attn_q.weightQ4_0[7168 7168]
-
blk.6.attn_v.weightQ4_0[7168 1024]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_down.weightQ4_0[19200 7168]
-
blk.7.ffn_gate.weightQ4_0[7168 19200]
-
blk.7.ffn_up.weightQ4_0[7168 19200]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.7.attn_k.weightQ4_0[7168 1024]
-
blk.7.attn_output.weightQ4_0[7168 7168]
-
blk.7.attn_q.weightQ4_0[7168 7168]
-
blk.7.attn_v.weightQ4_0[7168 1024]
-
blk.8.ffn_gate.weightQ4_0[7168 19200]
-
blk.8.ffn_up.weightQ4_0[7168 19200]
-
blk.8.attn_k.weightQ4_0[7168 1024]
-
blk.8.attn_output.weightQ4_0[7168 7168]
-
blk.8.attn_q.weightQ4_0[7168 7168]
-
blk.8.attn_v.weightQ4_0[7168 1024]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_down.weightQ4_0[19200 7168]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_down.weightQ4_0[19200 7168]
-
blk.9.ffn_gate.weightQ4_0[7168 19200]
-
blk.9.ffn_up.weightQ4_0[7168 19200]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.9.attn_k.weightQ4_0[7168 1024]
-
blk.9.attn_output.weightQ4_0[7168 7168]
-
blk.9.attn_q.weightQ4_0[7168 7168]
-
blk.9.attn_v.weightQ4_0[7168 1024]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_down.weightQ4_0[19200 7168]
-
blk.10.ffn_gate.weightQ4_0[7168 19200]
-
blk.10.ffn_up.weightQ4_0[7168 19200]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.10.attn_k.weightQ4_0[7168 1024]
-
blk.10.attn_output.weightQ4_0[7168 7168]
-
blk.10.attn_q.weightQ4_0[7168 7168]
-
blk.10.attn_v.weightQ4_0[7168 1024]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_down.weightQ4_0[19200 7168]
-
blk.11.ffn_gate.weightQ4_0[7168 19200]
-
blk.11.ffn_up.weightQ4_0[7168 19200]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.11.attn_k.weightQ4_0[7168 1024]
-
blk.11.attn_output.weightQ4_0[7168 7168]
-
blk.11.attn_q.weightQ4_0[7168 7168]
-
blk.11.attn_v.weightQ4_0[7168 1024]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_down.weightQ4_0[19200 7168]
-
blk.12.ffn_gate.weightQ4_0[7168 19200]
-
blk.12.ffn_up.weightQ4_0[7168 19200]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.12.attn_k.weightQ4_0[7168 1024]
-
blk.12.attn_output.weightQ4_0[7168 7168]
-
blk.12.attn_q.weightQ4_0[7168 7168]
-
blk.12.attn_v.weightQ4_0[7168 1024]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_down.weightQ4_0[19200 7168]
-
blk.13.ffn_gate.weightQ4_0[7168 19200]
-
blk.13.ffn_up.weightQ4_0[7168 19200]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.13.attn_k.weightQ4_0[7168 1024]
-
blk.13.attn_output.weightQ4_0[7168 7168]
-
blk.13.attn_q.weightQ4_0[7168 7168]
-
blk.13.attn_v.weightQ4_0[7168 1024]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_down.weightQ4_0[19200 7168]
-
blk.14.ffn_gate.weightQ4_0[7168 19200]
-
blk.14.ffn_up.weightQ4_0[7168 19200]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.14.attn_k.weightQ4_0[7168 1024]
-
blk.14.attn_output.weightQ4_0[7168 7168]
-
blk.14.attn_q.weightQ4_0[7168 7168]
-
blk.14.attn_v.weightQ4_0[7168 1024]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_down.weightQ4_0[19200 7168]
-
blk.15.ffn_gate.weightQ4_0[7168 19200]
-
blk.15.ffn_up.weightQ4_0[7168 19200]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.15.attn_k.weightQ4_0[7168 1024]
-
blk.15.attn_output.weightQ4_0[7168 7168]
-
blk.15.attn_q.weightQ4_0[7168 7168]
-
blk.15.attn_v.weightQ4_0[7168 1024]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_down.weightQ4_0[19200 7168]
-
blk.16.ffn_gate.weightQ4_0[7168 19200]
-
blk.16.ffn_up.weightQ4_0[7168 19200]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.16.attn_k.weightQ4_0[7168 1024]
-
blk.16.attn_output.weightQ4_0[7168 7168]
-
blk.16.attn_q.weightQ4_0[7168 7168]
-
blk.16.attn_v.weightQ4_0[7168 1024]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_down.weightQ4_0[19200 7168]
-
blk.17.ffn_gate.weightQ4_0[7168 19200]
-
blk.17.ffn_up.weightQ4_0[7168 19200]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.17.attn_k.weightQ4_0[7168 1024]
-
blk.17.attn_output.weightQ4_0[7168 7168]
-
blk.17.attn_q.weightQ4_0[7168 7168]
-
blk.17.attn_v.weightQ4_0[7168 1024]
-
blk.18.attn_k.weightQ4_0[7168 1024]
-
blk.18.attn_q.weightQ4_0[7168 7168]
-
blk.18.attn_v.weightQ4_0[7168 1024]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_down.weightQ4_0[19200 7168]
-
blk.18.ffn_gate.weightQ4_0[7168 19200]
-
blk.18.ffn_up.weightQ4_0[7168 19200]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.18.attn_output.weightQ4_0[7168 7168]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_down.weightQ4_0[19200 7168]
-
blk.19.ffn_gate.weightQ4_0[7168 19200]
-
blk.19.ffn_up.weightQ4_0[7168 19200]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.19.attn_k.weightQ4_0[7168 1024]
-
blk.19.attn_output.weightQ4_0[7168 7168]
-
blk.19.attn_q.weightQ4_0[7168 7168]
-
blk.19.attn_v.weightQ4_0[7168 1024]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_down.weightQ4_0[19200 7168]
-
blk.20.ffn_gate.weightQ4_0[7168 19200]
-
blk.20.ffn_up.weightQ4_0[7168 19200]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.20.attn_k.weightQ4_0[7168 1024]
-
blk.20.attn_output.weightQ4_0[7168 7168]
-
blk.20.attn_q.weightQ4_0[7168 7168]
-
blk.20.attn_v.weightQ4_0[7168 1024]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_down.weightQ4_0[19200 7168]
-
blk.21.ffn_gate.weightQ4_0[7168 19200]
-
blk.21.ffn_up.weightQ4_0[7168 19200]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.21.attn_k.weightQ4_0[7168 1024]
-
blk.21.attn_output.weightQ4_0[7168 7168]
-
blk.21.attn_q.weightQ4_0[7168 7168]
-
blk.21.attn_v.weightQ4_0[7168 1024]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_down.weightQ4_0[19200 7168]
-
blk.22.ffn_gate.weightQ4_0[7168 19200]
-
blk.22.ffn_up.weightQ4_0[7168 19200]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.22.attn_k.weightQ4_0[7168 1024]
-
blk.22.attn_output.weightQ4_0[7168 7168]
-
blk.22.attn_q.weightQ4_0[7168 7168]
-
blk.22.attn_v.weightQ4_0[7168 1024]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_down.weightQ4_0[19200 7168]
-
blk.23.ffn_gate.weightQ4_0[7168 19200]
-
blk.23.ffn_up.weightQ4_0[7168 19200]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.23.attn_k.weightQ4_0[7168 1024]
-
blk.23.attn_output.weightQ4_0[7168 7168]
-
blk.23.attn_q.weightQ4_0[7168 7168]
-
blk.23.attn_v.weightQ4_0[7168 1024]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_down.weightQ4_0[19200 7168]
-
blk.24.ffn_gate.weightQ4_0[7168 19200]
-
blk.24.ffn_up.weightQ4_0[7168 19200]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.24.attn_k.weightQ4_0[7168 1024]
-
blk.24.attn_output.weightQ4_0[7168 7168]
-
blk.24.attn_q.weightQ4_0[7168 7168]
-
blk.24.attn_v.weightQ4_0[7168 1024]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_down.weightQ4_0[19200 7168]
-
blk.25.ffn_gate.weightQ4_0[7168 19200]
-
blk.25.ffn_up.weightQ4_0[7168 19200]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.25.attn_k.weightQ4_0[7168 1024]
-
blk.25.attn_output.weightQ4_0[7168 7168]
-
blk.25.attn_q.weightQ4_0[7168 7168]
-
blk.25.attn_v.weightQ4_0[7168 1024]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_down.weightQ4_0[19200 7168]
-
blk.26.ffn_gate.weightQ4_0[7168 19200]
-
blk.26.ffn_up.weightQ4_0[7168 19200]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.26.attn_k.weightQ4_0[7168 1024]
-
blk.26.attn_output.weightQ4_0[7168 7168]
-
blk.26.attn_q.weightQ4_0[7168 7168]
-
blk.26.attn_v.weightQ4_0[7168 1024]
-
blk.27.ffn_gate.weightQ4_0[7168 19200]
-
blk.27.attn_k.weightQ4_0[7168 1024]
-
blk.27.attn_output.weightQ4_0[7168 7168]
-
blk.27.attn_q.weightQ4_0[7168 7168]
-
blk.27.attn_v.weightQ4_0[7168 1024]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_down.weightQ4_0[19200 7168]
-
blk.27.ffn_up.weightQ4_0[7168 19200]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_down.weightQ4_0[19200 7168]
-
blk.28.ffn_gate.weightQ4_0[7168 19200]
-
blk.28.ffn_up.weightQ4_0[7168 19200]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.28.attn_k.weightQ4_0[7168 1024]
-
blk.28.attn_output.weightQ4_0[7168 7168]
-
blk.28.attn_q.weightQ4_0[7168 7168]
-
blk.28.attn_v.weightQ4_0[7168 1024]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_down.weightQ4_0[19200 7168]
-
blk.29.ffn_gate.weightQ4_0[7168 19200]
-
blk.29.ffn_up.weightQ4_0[7168 19200]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.29.attn_k.weightQ4_0[7168 1024]
-
blk.29.attn_output.weightQ4_0[7168 7168]
-
blk.29.attn_q.weightQ4_0[7168 7168]
-
blk.29.attn_v.weightQ4_0[7168 1024]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_down.weightQ4_0[19200 7168]
-
blk.30.ffn_gate.weightQ4_0[7168 19200]
-
blk.30.ffn_up.weightQ4_0[7168 19200]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.30.attn_k.weightQ4_0[7168 1024]
-
blk.30.attn_output.weightQ4_0[7168 7168]
-
blk.30.attn_q.weightQ4_0[7168 7168]
-
blk.30.attn_v.weightQ4_0[7168 1024]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_down.weightQ4_0[19200 7168]
-
blk.31.ffn_gate.weightQ4_0[7168 19200]
-
blk.31.ffn_up.weightQ4_0[7168 19200]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.31.attn_k.weightQ4_0[7168 1024]
-
blk.31.attn_output.weightQ4_0[7168 7168]
-
blk.31.attn_q.weightQ4_0[7168 7168]
-
blk.31.attn_v.weightQ4_0[7168 1024]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_down.weightQ4_0[19200 7168]
-
blk.32.ffn_gate.weightQ4_0[7168 19200]
-
blk.32.ffn_up.weightQ4_0[7168 19200]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.32.attn_k.weightQ4_0[7168 1024]
-
blk.32.attn_output.weightQ4_0[7168 7168]
-
blk.32.attn_q.weightQ4_0[7168 7168]
-
blk.32.attn_v.weightQ4_0[7168 1024]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_down.weightQ4_0[19200 7168]
-
blk.33.ffn_gate.weightQ4_0[7168 19200]
-
blk.33.ffn_up.weightQ4_0[7168 19200]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.33.attn_k.weightQ4_0[7168 1024]
-
blk.33.attn_output.weightQ4_0[7168 7168]
-
blk.33.attn_q.weightQ4_0[7168 7168]
-
blk.33.attn_v.weightQ4_0[7168 1024]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_down.weightQ4_0[19200 7168]
-
blk.34.ffn_gate.weightQ4_0[7168 19200]
-
blk.34.ffn_up.weightQ4_0[7168 19200]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.34.attn_k.weightQ4_0[7168 1024]
-
blk.34.attn_output.weightQ4_0[7168 7168]
-
blk.34.attn_q.weightQ4_0[7168 7168]
-
blk.34.attn_v.weightQ4_0[7168 1024]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_down.weightQ4_0[19200 7168]
-
blk.35.ffn_gate.weightQ4_0[7168 19200]
-
blk.35.ffn_up.weightQ4_0[7168 19200]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.35.attn_k.weightQ4_0[7168 1024]
-
blk.35.attn_output.weightQ4_0[7168 7168]
-
blk.35.attn_q.weightQ4_0[7168 7168]
-
blk.35.attn_v.weightQ4_0[7168 1024]
-
blk.36.ffn_gate.weightQ4_0[7168 19200]
-
blk.36.ffn_up.weightQ4_0[7168 19200]
-
blk.36.attn_k.weightQ4_0[7168 1024]
-
blk.36.attn_output.weightQ4_0[7168 7168]
-
blk.36.attn_q.weightQ4_0[7168 7168]
-
blk.36.attn_v.weightQ4_0[7168 1024]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_down.weightQ4_0[19200 7168]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_down.weightQ4_0[19200 7168]
-
blk.37.ffn_gate.weightQ4_0[7168 19200]
-
blk.37.ffn_up.weightQ4_0[7168 19200]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.37.attn_k.weightQ4_0[7168 1024]
-
blk.37.attn_output.weightQ4_0[7168 7168]
-
blk.37.attn_q.weightQ4_0[7168 7168]
-
blk.37.attn_v.weightQ4_0[7168 1024]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_down.weightQ4_0[19200 7168]
-
blk.38.ffn_gate.weightQ4_0[7168 19200]
-
blk.38.ffn_up.weightQ4_0[7168 19200]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.38.attn_k.weightQ4_0[7168 1024]
-
blk.38.attn_output.weightQ4_0[7168 7168]
-
blk.38.attn_q.weightQ4_0[7168 7168]
-
blk.38.attn_v.weightQ4_0[7168 1024]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_down.weightQ4_0[19200 7168]
-
blk.39.ffn_gate.weightQ4_0[7168 19200]
-
blk.39.ffn_up.weightQ4_0[7168 19200]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.39.attn_k.weightQ4_0[7168 1024]
-
blk.39.attn_output.weightQ4_0[7168 7168]
-
blk.39.attn_q.weightQ4_0[7168 7168]
-
blk.39.attn_v.weightQ4_0[7168 1024]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_down.weightQ4_0[19200 7168]
-
blk.40.ffn_gate.weightQ4_0[7168 19200]
-
blk.40.ffn_up.weightQ4_0[7168 19200]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.40.attn_k.weightQ4_0[7168 1024]
-
blk.40.attn_output.weightQ4_0[7168 7168]
-
blk.40.attn_q.weightQ4_0[7168 7168]
-
blk.40.attn_v.weightQ4_0[7168 1024]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_down.weightQ4_0[19200 7168]
-
blk.41.ffn_gate.weightQ4_0[7168 19200]
-
blk.41.ffn_up.weightQ4_0[7168 19200]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.41.attn_k.weightQ4_0[7168 1024]
-
blk.41.attn_output.weightQ4_0[7168 7168]
-
blk.41.attn_q.weightQ4_0[7168 7168]
-
blk.41.attn_v.weightQ4_0[7168 1024]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_down.weightQ4_0[19200 7168]
-
blk.42.ffn_gate.weightQ4_0[7168 19200]
-
blk.42.ffn_up.weightQ4_0[7168 19200]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.42.attn_k.weightQ4_0[7168 1024]
-
blk.42.attn_output.weightQ4_0[7168 7168]
-
blk.42.attn_q.weightQ4_0[7168 7168]
-
blk.42.attn_v.weightQ4_0[7168 1024]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_down.weightQ4_0[19200 7168]
-
blk.43.ffn_gate.weightQ4_0[7168 19200]
-
blk.43.ffn_up.weightQ4_0[7168 19200]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.43.attn_k.weightQ4_0[7168 1024]
-
blk.43.attn_output.weightQ4_0[7168 7168]
-
blk.43.attn_q.weightQ4_0[7168 7168]
-
blk.43.attn_v.weightQ4_0[7168 1024]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_down.weightQ4_0[19200 7168]
-
blk.44.ffn_gate.weightQ4_0[7168 19200]
-
blk.44.ffn_up.weightQ4_0[7168 19200]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.44.attn_k.weightQ4_0[7168 1024]
-
blk.44.attn_output.weightQ4_0[7168 7168]
-
blk.44.attn_q.weightQ4_0[7168 7168]
-
blk.44.attn_v.weightQ4_0[7168 1024]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_down.weightQ4_0[19200 7168]
-
blk.45.ffn_gate.weightQ4_0[7168 19200]
-
blk.45.ffn_up.weightQ4_0[7168 19200]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.45.attn_k.weightQ4_0[7168 1024]
-
blk.45.attn_output.weightQ4_0[7168 7168]
-
blk.45.attn_q.weightQ4_0[7168 7168]
-
blk.45.attn_v.weightQ4_0[7168 1024]
-
blk.46.attn_k.weightQ4_0[7168 1024]
-
blk.46.attn_q.weightQ4_0[7168 7168]
-
blk.46.attn_v.weightQ4_0[7168 1024]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_down.weightQ4_0[19200 7168]
-
blk.46.ffn_gate.weightQ4_0[7168 19200]
-
blk.46.ffn_up.weightQ4_0[7168 19200]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.46.attn_output.weightQ4_0[7168 7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_down.weightQ4_0[19200 7168]
-
blk.47.ffn_gate.weightQ4_0[7168 19200]
-
blk.47.ffn_up.weightQ4_0[7168 19200]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.47.attn_k.weightQ4_0[7168 1024]
-
blk.47.attn_output.weightQ4_0[7168 7168]
-
blk.47.attn_q.weightQ4_0[7168 7168]
-
blk.47.attn_v.weightQ4_0[7168 1024]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_down.weightQ4_0[19200 7168]
-
blk.48.ffn_gate.weightQ4_0[7168 19200]
-
blk.48.ffn_up.weightQ4_0[7168 19200]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.48.attn_k.weightQ4_0[7168 1024]
-
blk.48.attn_output.weightQ4_0[7168 7168]
-
blk.48.attn_q.weightQ4_0[7168 7168]
-
blk.48.attn_v.weightQ4_0[7168 1024]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_down.weightQ4_0[19200 7168]
-
blk.49.ffn_gate.weightQ4_0[7168 19200]
-
blk.49.ffn_up.weightQ4_0[7168 19200]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.49.attn_k.weightQ4_0[7168 1024]
-
blk.49.attn_output.weightQ4_0[7168 7168]
-
blk.49.attn_q.weightQ4_0[7168 7168]
-
blk.49.attn_v.weightQ4_0[7168 1024]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_down.weightQ4_0[19200 7168]
-
blk.50.ffn_gate.weightQ4_0[7168 19200]
-
blk.50.ffn_up.weightQ4_0[7168 19200]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.50.attn_k.weightQ4_0[7168 1024]
-
blk.50.attn_output.weightQ4_0[7168 7168]
-
blk.50.attn_q.weightQ4_0[7168 7168]
-
blk.50.attn_v.weightQ4_0[7168 1024]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_down.weightQ4_0[19200 7168]
-
blk.51.ffn_gate.weightQ4_0[7168 19200]
-
blk.51.ffn_up.weightQ4_0[7168 19200]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.51.attn_k.weightQ4_0[7168 1024]
-
blk.51.attn_output.weightQ4_0[7168 7168]
-
blk.51.attn_q.weightQ4_0[7168 7168]
-
blk.51.attn_v.weightQ4_0[7168 1024]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_down.weightQ4_0[19200 7168]
-
blk.52.ffn_gate.weightQ4_0[7168 19200]
-
blk.52.ffn_up.weightQ4_0[7168 19200]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.52.attn_k.weightQ4_0[7168 1024]
-
blk.52.attn_output.weightQ4_0[7168 7168]
-
blk.52.attn_q.weightQ4_0[7168 7168]
-
blk.52.attn_v.weightQ4_0[7168 1024]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_down.weightQ4_0[19200 7168]
-
blk.53.ffn_gate.weightQ4_0[7168 19200]
-
blk.53.ffn_up.weightQ4_0[7168 19200]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.53.attn_k.weightQ4_0[7168 1024]
-
blk.53.attn_output.weightQ4_0[7168 7168]
-
blk.53.attn_q.weightQ4_0[7168 7168]
-
blk.53.attn_v.weightQ4_0[7168 1024]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_down.weightQ4_0[19200 7168]
-
blk.54.ffn_gate.weightQ4_0[7168 19200]
-
blk.54.ffn_up.weightQ4_0[7168 19200]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.54.attn_k.weightQ4_0[7168 1024]
-
blk.54.attn_output.weightQ4_0[7168 7168]
-
blk.54.attn_q.weightQ4_0[7168 7168]
-
blk.54.attn_v.weightQ4_0[7168 1024]
-
blk.55.ffn_gate.weightQ4_0[7168 19200]
-
blk.55.attn_k.weightQ4_0[7168 1024]
-
blk.55.attn_output.weightQ4_0[7168 7168]
-
blk.55.attn_q.weightQ4_0[7168 7168]
-
blk.55.attn_v.weightQ4_0[7168 1024]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_down.weightQ4_0[19200 7168]
-
blk.55.ffn_up.weightQ4_0[7168 19200]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_down.weightQ4_0[19200 7168]
-
blk.56.ffn_gate.weightQ4_0[7168 19200]
-
blk.56.ffn_up.weightQ4_0[7168 19200]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.56.attn_k.weightQ4_0[7168 1024]
-
blk.56.attn_output.weightQ4_0[7168 7168]
-
blk.56.attn_q.weightQ4_0[7168 7168]
-
blk.56.attn_v.weightQ4_0[7168 1024]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_down.weightQ4_0[19200 7168]
-
blk.57.ffn_gate.weightQ4_0[7168 19200]
-
blk.57.ffn_up.weightQ4_0[7168 19200]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.57.attn_k.weightQ4_0[7168 1024]
-
blk.57.attn_output.weightQ4_0[7168 7168]
-
blk.57.attn_q.weightQ4_0[7168 7168]
-
blk.57.attn_v.weightQ4_0[7168 1024]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_down.weightQ4_0[19200 7168]
-
blk.58.ffn_gate.weightQ4_0[7168 19200]
-
blk.58.ffn_up.weightQ4_0[7168 19200]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.58.attn_k.weightQ4_0[7168 1024]
-
blk.58.attn_output.weightQ4_0[7168 7168]
-
blk.58.attn_q.weightQ4_0[7168 7168]
-
blk.58.attn_v.weightQ4_0[7168 1024]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_down.weightQ4_0[19200 7168]
-
blk.59.ffn_gate.weightQ4_0[7168 19200]
-
blk.59.ffn_up.weightQ4_0[7168 19200]
-
blk.59.ffn_norm.weightF32[7168]
-
blk.59.attn_k.weightQ4_0[7168 1024]
-
blk.59.attn_output.weightQ4_0[7168 7168]
-
blk.59.attn_q.weightQ4_0[7168 7168]
-
blk.59.attn_v.weightQ4_0[7168 1024]
-
blk.60.attn_norm.weightF32[7168]
-
blk.60.ffn_down.weightQ4_0[19200 7168]
-
blk.60.ffn_gate.weightQ4_0[7168 19200]
-
blk.60.ffn_up.weightQ4_0[7168 19200]
-
blk.60.ffn_norm.weightF32[7168]
-
blk.60.attn_k.weightQ4_0[7168 1024]
-
blk.60.attn_output.weightQ4_0[7168 7168]
-
blk.60.attn_q.weightQ4_0[7168 7168]
-
blk.60.attn_v.weightQ4_0[7168 1024]
-
blk.61.attn_norm.weightF32[7168]
-
blk.61.ffn_down.weightQ4_0[19200 7168]
-
blk.61.ffn_gate.weightQ4_0[7168 19200]
-
blk.61.ffn_up.weightQ4_0[7168 19200]
-
blk.61.ffn_norm.weightF32[7168]
-
blk.61.attn_k.weightQ4_0[7168 1024]
-
blk.61.attn_output.weightQ4_0[7168 7168]
-
blk.61.attn_q.weightQ4_0[7168 7168]
-
blk.61.attn_v.weightQ4_0[7168 1024]
-
output.weightQ6_K[7168 32256]
-
output_norm.weightF32[7168]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61