latest
19GB
codeFuse-deepseek-33b is a 33B Code-LLM finetuned by QLoRA on multiple code-related tasks on the base model deepseek-coder-33b.
Tools
33B
40 Pulls Updated 5 weeks ago
08d3f6958c9e · 19GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count62
-
llama.context_length16384
-
llama.embedding_length7168
-
llama.feed_forward_length19200
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
llama.vocab_size32256
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32014
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.predeepseek-coder
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_0[7168 32256]
-
blk.0.attn_q.weightQ4_0[7168 7168]
-
blk.0.attn_k.weightQ4_0[7168 1024]
-
blk.0.attn_v.weightQ4_0[7168 1024]
-
blk.0.attn_output.weightQ4_0[7168 7168]
-
blk.0.ffn_gate.weightQ4_0[7168 19200]
-
blk.0.ffn_up.weightQ4_0[7168 19200]
-
blk.0.ffn_down.weightQ4_0[19200 7168]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.1.attn_q.weightQ4_0[7168 7168]
-
blk.1.attn_k.weightQ4_0[7168 1024]
-
blk.1.attn_v.weightQ4_0[7168 1024]
-
blk.1.attn_output.weightQ4_0[7168 7168]
-
blk.1.ffn_gate.weightQ4_0[7168 19200]
-
blk.1.ffn_up.weightQ4_0[7168 19200]
-
blk.1.ffn_down.weightQ4_0[19200 7168]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.2.attn_q.weightQ4_0[7168 7168]
-
blk.2.attn_k.weightQ4_0[7168 1024]
-
blk.2.attn_v.weightQ4_0[7168 1024]
-
blk.2.attn_output.weightQ4_0[7168 7168]
-
blk.2.ffn_gate.weightQ4_0[7168 19200]
-
blk.2.ffn_up.weightQ4_0[7168 19200]
-
blk.2.ffn_down.weightQ4_0[19200 7168]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.3.attn_q.weightQ4_0[7168 7168]
-
blk.3.attn_k.weightQ4_0[7168 1024]
-
blk.3.attn_v.weightQ4_0[7168 1024]
-
blk.3.attn_output.weightQ4_0[7168 7168]
-
blk.3.ffn_gate.weightQ4_0[7168 19200]
-
blk.3.ffn_up.weightQ4_0[7168 19200]
-
blk.3.ffn_down.weightQ4_0[19200 7168]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.4.attn_q.weightQ4_0[7168 7168]
-
blk.4.attn_k.weightQ4_0[7168 1024]
-
blk.4.attn_v.weightQ4_0[7168 1024]
-
blk.4.attn_output.weightQ4_0[7168 7168]
-
blk.4.ffn_gate.weightQ4_0[7168 19200]
-
blk.4.ffn_up.weightQ4_0[7168 19200]
-
blk.4.ffn_down.weightQ4_0[19200 7168]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.5.attn_q.weightQ4_0[7168 7168]
-
blk.5.attn_k.weightQ4_0[7168 1024]
-
blk.5.attn_v.weightQ4_0[7168 1024]
-
blk.5.attn_output.weightQ4_0[7168 7168]
-
blk.5.ffn_gate.weightQ4_0[7168 19200]
-
blk.5.ffn_up.weightQ4_0[7168 19200]
-
blk.5.ffn_down.weightQ4_0[19200 7168]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.6.attn_q.weightQ4_0[7168 7168]
-
blk.6.attn_k.weightQ4_0[7168 1024]
-
blk.6.attn_v.weightQ4_0[7168 1024]
-
blk.6.attn_output.weightQ4_0[7168 7168]
-
blk.6.ffn_gate.weightQ4_0[7168 19200]
-
blk.6.ffn_up.weightQ4_0[7168 19200]
-
blk.6.ffn_down.weightQ4_0[19200 7168]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.7.attn_q.weightQ4_0[7168 7168]
-
blk.7.attn_k.weightQ4_0[7168 1024]
-
blk.7.attn_v.weightQ4_0[7168 1024]
-
blk.7.attn_output.weightQ4_0[7168 7168]
-
blk.7.ffn_gate.weightQ4_0[7168 19200]
-
blk.7.ffn_up.weightQ4_0[7168 19200]
-
blk.7.ffn_down.weightQ4_0[19200 7168]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.8.attn_q.weightQ4_0[7168 7168]
-
blk.8.attn_k.weightQ4_0[7168 1024]
-
blk.8.attn_v.weightQ4_0[7168 1024]
-
blk.8.attn_output.weightQ4_0[7168 7168]
-
blk.8.ffn_gate.weightQ4_0[7168 19200]
-
blk.8.ffn_up.weightQ4_0[7168 19200]
-
blk.8.ffn_down.weightQ4_0[19200 7168]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.9.attn_q.weightQ4_0[7168 7168]
-
blk.9.attn_k.weightQ4_0[7168 1024]
-
blk.9.attn_v.weightQ4_0[7168 1024]
-
blk.9.attn_output.weightQ4_0[7168 7168]
-
blk.9.ffn_gate.weightQ4_0[7168 19200]
-
blk.9.ffn_up.weightQ4_0[7168 19200]
-
blk.9.ffn_down.weightQ4_0[19200 7168]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.10.attn_q.weightQ4_0[7168 7168]
-
blk.10.attn_k.weightQ4_0[7168 1024]
-
blk.10.attn_v.weightQ4_0[7168 1024]
-
blk.10.attn_output.weightQ4_0[7168 7168]
-
blk.10.ffn_gate.weightQ4_0[7168 19200]
-
blk.10.ffn_up.weightQ4_0[7168 19200]
-
blk.10.ffn_down.weightQ4_0[19200 7168]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.11.attn_q.weightQ4_0[7168 7168]
-
blk.11.attn_k.weightQ4_0[7168 1024]
-
blk.11.attn_v.weightQ4_0[7168 1024]
-
blk.11.attn_output.weightQ4_0[7168 7168]
-
blk.11.ffn_gate.weightQ4_0[7168 19200]
-
blk.11.ffn_up.weightQ4_0[7168 19200]
-
blk.11.ffn_down.weightQ4_0[19200 7168]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.12.attn_q.weightQ4_0[7168 7168]
-
blk.12.attn_k.weightQ4_0[7168 1024]
-
blk.12.attn_v.weightQ4_0[7168 1024]
-
blk.12.attn_output.weightQ4_0[7168 7168]
-
blk.12.ffn_gate.weightQ4_0[7168 19200]
-
blk.12.ffn_up.weightQ4_0[7168 19200]
-
blk.12.ffn_down.weightQ4_0[19200 7168]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.13.attn_q.weightQ4_0[7168 7168]
-
blk.13.attn_k.weightQ4_0[7168 1024]
-
blk.13.attn_v.weightQ4_0[7168 1024]
-
blk.13.attn_output.weightQ4_0[7168 7168]
-
blk.13.ffn_gate.weightQ4_0[7168 19200]
-
blk.13.ffn_up.weightQ4_0[7168 19200]
-
blk.13.ffn_down.weightQ4_0[19200 7168]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.14.attn_q.weightQ4_0[7168 7168]
-
blk.14.attn_k.weightQ4_0[7168 1024]
-
blk.14.attn_v.weightQ4_0[7168 1024]
-
blk.14.attn_output.weightQ4_0[7168 7168]
-
blk.14.ffn_gate.weightQ4_0[7168 19200]
-
blk.14.ffn_up.weightQ4_0[7168 19200]
-
blk.14.ffn_down.weightQ4_0[19200 7168]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.15.attn_q.weightQ4_0[7168 7168]
-
blk.15.attn_k.weightQ4_0[7168 1024]
-
blk.15.attn_v.weightQ4_0[7168 1024]
-
blk.15.attn_output.weightQ4_0[7168 7168]
-
blk.15.ffn_gate.weightQ4_0[7168 19200]
-
blk.15.ffn_up.weightQ4_0[7168 19200]
-
blk.15.ffn_down.weightQ4_0[19200 7168]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.16.attn_q.weightQ4_0[7168 7168]
-
blk.16.attn_k.weightQ4_0[7168 1024]
-
blk.16.attn_v.weightQ4_0[7168 1024]
-
blk.16.attn_output.weightQ4_0[7168 7168]
-
blk.16.ffn_gate.weightQ4_0[7168 19200]
-
blk.16.ffn_up.weightQ4_0[7168 19200]
-
blk.16.ffn_down.weightQ4_0[19200 7168]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.17.attn_q.weightQ4_0[7168 7168]
-
blk.17.attn_k.weightQ4_0[7168 1024]
-
blk.17.attn_v.weightQ4_0[7168 1024]
-
blk.17.attn_output.weightQ4_0[7168 7168]
-
blk.17.ffn_gate.weightQ4_0[7168 19200]
-
blk.17.ffn_up.weightQ4_0[7168 19200]
-
blk.17.ffn_down.weightQ4_0[19200 7168]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.18.attn_q.weightQ4_0[7168 7168]
-
blk.18.attn_k.weightQ4_0[7168 1024]
-
blk.18.attn_v.weightQ4_0[7168 1024]
-
blk.18.attn_output.weightQ4_0[7168 7168]
-
blk.18.ffn_gate.weightQ4_0[7168 19200]
-
blk.18.ffn_up.weightQ4_0[7168 19200]
-
blk.18.ffn_down.weightQ4_0[19200 7168]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.19.attn_q.weightQ4_0[7168 7168]
-
blk.19.attn_k.weightQ4_0[7168 1024]
-
blk.19.attn_v.weightQ4_0[7168 1024]
-
blk.19.attn_output.weightQ4_0[7168 7168]
-
blk.19.ffn_gate.weightQ4_0[7168 19200]
-
blk.19.ffn_up.weightQ4_0[7168 19200]
-
blk.19.ffn_down.weightQ4_0[19200 7168]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.20.attn_q.weightQ4_0[7168 7168]
-
blk.20.attn_k.weightQ4_0[7168 1024]
-
blk.20.attn_v.weightQ4_0[7168 1024]
-
blk.20.attn_output.weightQ4_0[7168 7168]
-
blk.20.ffn_gate.weightQ4_0[7168 19200]
-
blk.20.ffn_up.weightQ4_0[7168 19200]
-
blk.20.ffn_down.weightQ4_0[19200 7168]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.21.attn_q.weightQ4_0[7168 7168]
-
blk.21.attn_k.weightQ4_0[7168 1024]
-
blk.21.attn_v.weightQ4_0[7168 1024]
-
blk.21.attn_output.weightQ4_0[7168 7168]
-
blk.21.ffn_gate.weightQ4_0[7168 19200]
-
blk.21.ffn_up.weightQ4_0[7168 19200]
-
blk.21.ffn_down.weightQ4_0[19200 7168]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.22.attn_q.weightQ4_0[7168 7168]
-
blk.22.attn_k.weightQ4_0[7168 1024]
-
blk.22.attn_v.weightQ4_0[7168 1024]
-
blk.22.attn_output.weightQ4_0[7168 7168]
-
blk.22.ffn_gate.weightQ4_0[7168 19200]
-
blk.22.ffn_up.weightQ4_0[7168 19200]
-
blk.22.ffn_down.weightQ4_0[19200 7168]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.23.attn_q.weightQ4_0[7168 7168]
-
blk.23.attn_k.weightQ4_0[7168 1024]
-
blk.23.attn_v.weightQ4_0[7168 1024]
-
blk.23.attn_output.weightQ4_0[7168 7168]
-
blk.23.ffn_gate.weightQ4_0[7168 19200]
-
blk.23.ffn_up.weightQ4_0[7168 19200]
-
blk.23.ffn_down.weightQ4_0[19200 7168]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.24.attn_q.weightQ4_0[7168 7168]
-
blk.24.attn_k.weightQ4_0[7168 1024]
-
blk.24.attn_v.weightQ4_0[7168 1024]
-
blk.24.attn_output.weightQ4_0[7168 7168]
-
blk.24.ffn_gate.weightQ4_0[7168 19200]
-
blk.24.ffn_up.weightQ4_0[7168 19200]
-
blk.24.ffn_down.weightQ4_0[19200 7168]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.25.attn_q.weightQ4_0[7168 7168]
-
blk.25.attn_k.weightQ4_0[7168 1024]
-
blk.25.attn_v.weightQ4_0[7168 1024]
-
blk.25.attn_output.weightQ4_0[7168 7168]
-
blk.25.ffn_gate.weightQ4_0[7168 19200]
-
blk.25.ffn_up.weightQ4_0[7168 19200]
-
blk.25.ffn_down.weightQ4_0[19200 7168]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.26.attn_q.weightQ4_0[7168 7168]
-
blk.26.attn_k.weightQ4_0[7168 1024]
-
blk.26.attn_v.weightQ4_0[7168 1024]
-
blk.26.attn_output.weightQ4_0[7168 7168]
-
blk.26.ffn_gate.weightQ4_0[7168 19200]
-
blk.26.ffn_up.weightQ4_0[7168 19200]
-
blk.26.ffn_down.weightQ4_0[19200 7168]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.27.attn_q.weightQ4_0[7168 7168]
-
blk.27.attn_k.weightQ4_0[7168 1024]
-
blk.27.attn_v.weightQ4_0[7168 1024]
-
blk.27.attn_output.weightQ4_0[7168 7168]
-
blk.27.ffn_gate.weightQ4_0[7168 19200]
-
blk.27.ffn_up.weightQ4_0[7168 19200]
-
blk.27.ffn_down.weightQ4_0[19200 7168]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.28.attn_q.weightQ4_0[7168 7168]
-
blk.28.attn_k.weightQ4_0[7168 1024]
-
blk.28.attn_v.weightQ4_0[7168 1024]
-
blk.28.attn_output.weightQ4_0[7168 7168]
-
blk.28.ffn_gate.weightQ4_0[7168 19200]
-
blk.28.ffn_up.weightQ4_0[7168 19200]
-
blk.28.ffn_down.weightQ4_0[19200 7168]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.29.attn_q.weightQ4_0[7168 7168]
-
blk.29.attn_k.weightQ4_0[7168 1024]
-
blk.29.attn_v.weightQ4_0[7168 1024]
-
blk.29.attn_output.weightQ4_0[7168 7168]
-
blk.29.ffn_gate.weightQ4_0[7168 19200]
-
blk.29.ffn_up.weightQ4_0[7168 19200]
-
blk.29.ffn_down.weightQ4_0[19200 7168]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.30.attn_q.weightQ4_0[7168 7168]
-
blk.30.attn_k.weightQ4_0[7168 1024]
-
blk.30.attn_v.weightQ4_0[7168 1024]
-
blk.30.attn_output.weightQ4_0[7168 7168]
-
blk.30.ffn_gate.weightQ4_0[7168 19200]
-
blk.30.ffn_up.weightQ4_0[7168 19200]
-
blk.30.ffn_down.weightQ4_0[19200 7168]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.31.attn_q.weightQ4_0[7168 7168]
-
blk.31.attn_k.weightQ4_0[7168 1024]
-
blk.31.attn_v.weightQ4_0[7168 1024]
-
blk.31.attn_output.weightQ4_0[7168 7168]
-
blk.31.ffn_gate.weightQ4_0[7168 19200]
-
blk.31.ffn_up.weightQ4_0[7168 19200]
-
blk.31.ffn_down.weightQ4_0[19200 7168]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.32.attn_q.weightQ4_0[7168 7168]
-
blk.32.attn_k.weightQ4_0[7168 1024]
-
blk.32.attn_v.weightQ4_0[7168 1024]
-
blk.32.attn_output.weightQ4_0[7168 7168]
-
blk.32.ffn_gate.weightQ4_0[7168 19200]
-
blk.32.ffn_up.weightQ4_0[7168 19200]
-
blk.32.ffn_down.weightQ4_0[19200 7168]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.33.attn_q.weightQ4_0[7168 7168]
-
blk.33.attn_k.weightQ4_0[7168 1024]
-
blk.33.attn_v.weightQ4_0[7168 1024]
-
blk.33.attn_output.weightQ4_0[7168 7168]
-
blk.33.ffn_gate.weightQ4_0[7168 19200]
-
blk.33.ffn_up.weightQ4_0[7168 19200]
-
blk.33.ffn_down.weightQ4_0[19200 7168]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.34.attn_q.weightQ4_0[7168 7168]
-
blk.34.attn_k.weightQ4_0[7168 1024]
-
blk.34.attn_v.weightQ4_0[7168 1024]
-
blk.34.attn_output.weightQ4_0[7168 7168]
-
blk.34.ffn_gate.weightQ4_0[7168 19200]
-
blk.34.ffn_up.weightQ4_0[7168 19200]
-
blk.34.ffn_down.weightQ4_0[19200 7168]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.35.attn_q.weightQ4_0[7168 7168]
-
blk.35.attn_k.weightQ4_0[7168 1024]
-
blk.35.attn_v.weightQ4_0[7168 1024]
-
blk.35.attn_output.weightQ4_0[7168 7168]
-
blk.35.ffn_gate.weightQ4_0[7168 19200]
-
blk.35.ffn_up.weightQ4_0[7168 19200]
-
blk.35.ffn_down.weightQ4_0[19200 7168]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.36.attn_q.weightQ4_0[7168 7168]
-
blk.36.attn_k.weightQ4_0[7168 1024]
-
blk.36.attn_v.weightQ4_0[7168 1024]
-
blk.36.attn_output.weightQ4_0[7168 7168]
-
blk.36.ffn_gate.weightQ4_0[7168 19200]
-
blk.36.ffn_up.weightQ4_0[7168 19200]
-
blk.36.ffn_down.weightQ4_0[19200 7168]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.37.attn_q.weightQ4_0[7168 7168]
-
blk.37.attn_k.weightQ4_0[7168 1024]
-
blk.37.attn_v.weightQ4_0[7168 1024]
-
blk.37.attn_output.weightQ4_0[7168 7168]
-
blk.37.ffn_gate.weightQ4_0[7168 19200]
-
blk.37.ffn_up.weightQ4_0[7168 19200]
-
blk.37.ffn_down.weightQ4_0[19200 7168]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.38.attn_q.weightQ4_0[7168 7168]
-
blk.38.attn_k.weightQ4_0[7168 1024]
-
blk.38.attn_v.weightQ4_0[7168 1024]
-
blk.38.attn_output.weightQ4_0[7168 7168]
-
blk.38.ffn_gate.weightQ4_0[7168 19200]
-
blk.38.ffn_up.weightQ4_0[7168 19200]
-
blk.38.ffn_down.weightQ4_0[19200 7168]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.39.attn_q.weightQ4_0[7168 7168]
-
blk.39.attn_k.weightQ4_0[7168 1024]
-
blk.39.attn_v.weightQ4_0[7168 1024]
-
blk.39.attn_output.weightQ4_0[7168 7168]
-
blk.39.ffn_gate.weightQ4_0[7168 19200]
-
blk.39.ffn_up.weightQ4_0[7168 19200]
-
blk.39.ffn_down.weightQ4_0[19200 7168]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.40.attn_q.weightQ4_0[7168 7168]
-
blk.40.attn_k.weightQ4_0[7168 1024]
-
blk.40.attn_v.weightQ4_0[7168 1024]
-
blk.40.attn_output.weightQ4_0[7168 7168]
-
blk.40.ffn_gate.weightQ4_0[7168 19200]
-
blk.40.ffn_up.weightQ4_0[7168 19200]
-
blk.40.ffn_down.weightQ4_0[19200 7168]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.41.attn_q.weightQ4_0[7168 7168]
-
blk.41.attn_k.weightQ4_0[7168 1024]
-
blk.41.attn_v.weightQ4_0[7168 1024]
-
blk.41.attn_output.weightQ4_0[7168 7168]
-
blk.41.ffn_gate.weightQ4_0[7168 19200]
-
blk.41.ffn_up.weightQ4_0[7168 19200]
-
blk.41.ffn_down.weightQ4_0[19200 7168]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.42.attn_q.weightQ4_0[7168 7168]
-
blk.42.attn_k.weightQ4_0[7168 1024]
-
blk.42.attn_v.weightQ4_0[7168 1024]
-
blk.42.attn_output.weightQ4_0[7168 7168]
-
blk.42.ffn_gate.weightQ4_0[7168 19200]
-
blk.42.ffn_up.weightQ4_0[7168 19200]
-
blk.42.ffn_down.weightQ4_0[19200 7168]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.43.attn_q.weightQ4_0[7168 7168]
-
blk.43.attn_k.weightQ4_0[7168 1024]
-
blk.43.attn_v.weightQ4_0[7168 1024]
-
blk.43.attn_output.weightQ4_0[7168 7168]
-
blk.43.ffn_gate.weightQ4_0[7168 19200]
-
blk.43.ffn_up.weightQ4_0[7168 19200]
-
blk.43.ffn_down.weightQ4_0[19200 7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.44.attn_q.weightQ4_0[7168 7168]
-
blk.44.attn_k.weightQ4_0[7168 1024]
-
blk.44.attn_v.weightQ4_0[7168 1024]
-
blk.44.attn_output.weightQ4_0[7168 7168]
-
blk.44.ffn_gate.weightQ4_0[7168 19200]
-
blk.44.ffn_up.weightQ4_0[7168 19200]
-
blk.44.ffn_down.weightQ4_0[19200 7168]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.45.attn_q.weightQ4_0[7168 7168]
-
blk.45.attn_k.weightQ4_0[7168 1024]
-
blk.45.attn_v.weightQ4_0[7168 1024]
-
blk.45.attn_output.weightQ4_0[7168 7168]
-
blk.45.ffn_gate.weightQ4_0[7168 19200]
-
blk.45.ffn_up.weightQ4_0[7168 19200]
-
blk.45.ffn_down.weightQ4_0[19200 7168]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.46.attn_q.weightQ4_0[7168 7168]
-
blk.46.attn_k.weightQ4_0[7168 1024]
-
blk.46.attn_v.weightQ4_0[7168 1024]
-
blk.46.attn_output.weightQ4_0[7168 7168]
-
blk.46.ffn_gate.weightQ4_0[7168 19200]
-
blk.46.ffn_up.weightQ4_0[7168 19200]
-
blk.46.ffn_down.weightQ4_0[19200 7168]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.47.attn_q.weightQ4_0[7168 7168]
-
blk.47.attn_k.weightQ4_0[7168 1024]
-
blk.47.attn_v.weightQ4_0[7168 1024]
-
blk.47.attn_output.weightQ4_0[7168 7168]
-
blk.47.ffn_gate.weightQ4_0[7168 19200]
-
blk.47.ffn_up.weightQ4_0[7168 19200]
-
blk.47.ffn_down.weightQ4_0[19200 7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.48.attn_q.weightQ4_0[7168 7168]
-
blk.48.attn_k.weightQ4_0[7168 1024]
-
blk.48.attn_v.weightQ4_0[7168 1024]
-
blk.48.attn_output.weightQ4_0[7168 7168]
-
blk.48.ffn_gate.weightQ4_0[7168 19200]
-
blk.48.ffn_up.weightQ4_0[7168 19200]
-
blk.48.ffn_down.weightQ4_0[19200 7168]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.49.attn_q.weightQ4_0[7168 7168]
-
blk.49.attn_k.weightQ4_0[7168 1024]
-
blk.49.attn_v.weightQ4_0[7168 1024]
-
blk.49.attn_output.weightQ4_0[7168 7168]
-
blk.49.ffn_gate.weightQ4_0[7168 19200]
-
blk.49.ffn_up.weightQ4_0[7168 19200]
-
blk.49.ffn_down.weightQ4_0[19200 7168]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.50.attn_q.weightQ4_0[7168 7168]
-
blk.50.attn_k.weightQ4_0[7168 1024]
-
blk.50.attn_v.weightQ4_0[7168 1024]
-
blk.50.attn_output.weightQ4_0[7168 7168]
-
blk.50.ffn_gate.weightQ4_0[7168 19200]
-
blk.50.ffn_up.weightQ4_0[7168 19200]
-
blk.50.ffn_down.weightQ4_0[19200 7168]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.51.attn_q.weightQ4_0[7168 7168]
-
blk.51.attn_k.weightQ4_0[7168 1024]
-
blk.51.attn_v.weightQ4_0[7168 1024]
-
blk.51.attn_output.weightQ4_0[7168 7168]
-
blk.51.ffn_gate.weightQ4_0[7168 19200]
-
blk.51.ffn_up.weightQ4_0[7168 19200]
-
blk.51.ffn_down.weightQ4_0[19200 7168]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.52.attn_q.weightQ4_0[7168 7168]
-
blk.52.attn_k.weightQ4_0[7168 1024]
-
blk.52.attn_v.weightQ4_0[7168 1024]
-
blk.52.attn_output.weightQ4_0[7168 7168]
-
blk.52.ffn_gate.weightQ4_0[7168 19200]
-
blk.52.ffn_up.weightQ4_0[7168 19200]
-
blk.52.ffn_down.weightQ4_0[19200 7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.53.attn_q.weightQ4_0[7168 7168]
-
blk.53.attn_k.weightQ4_0[7168 1024]
-
blk.53.attn_v.weightQ4_0[7168 1024]
-
blk.53.attn_output.weightQ4_0[7168 7168]
-
blk.53.ffn_gate.weightQ4_0[7168 19200]
-
blk.53.ffn_up.weightQ4_0[7168 19200]
-
blk.53.ffn_down.weightQ4_0[19200 7168]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.54.attn_q.weightQ4_0[7168 7168]
-
blk.54.attn_k.weightQ4_0[7168 1024]
-
blk.54.attn_v.weightQ4_0[7168 1024]
-
blk.54.attn_output.weightQ4_0[7168 7168]
-
blk.54.ffn_gate.weightQ4_0[7168 19200]
-
blk.54.ffn_up.weightQ4_0[7168 19200]
-
blk.54.ffn_down.weightQ4_0[19200 7168]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.55.attn_q.weightQ4_0[7168 7168]
-
blk.55.attn_k.weightQ4_0[7168 1024]
-
blk.55.attn_v.weightQ4_0[7168 1024]
-
blk.55.attn_output.weightQ4_0[7168 7168]
-
blk.55.ffn_gate.weightQ4_0[7168 19200]
-
blk.55.ffn_up.weightQ4_0[7168 19200]
-
blk.55.ffn_down.weightQ4_0[19200 7168]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.56.attn_q.weightQ4_0[7168 7168]
-
blk.56.attn_k.weightQ4_0[7168 1024]
-
blk.56.attn_v.weightQ4_0[7168 1024]
-
blk.56.attn_output.weightQ4_0[7168 7168]
-
blk.56.ffn_gate.weightQ4_0[7168 19200]
-
blk.56.ffn_up.weightQ4_0[7168 19200]
-
blk.56.ffn_down.weightQ4_0[19200 7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.57.attn_q.weightQ4_0[7168 7168]
-
blk.57.attn_k.weightQ4_0[7168 1024]
-
blk.57.attn_v.weightQ4_0[7168 1024]
-
blk.57.attn_output.weightQ4_0[7168 7168]
-
blk.57.ffn_gate.weightQ4_0[7168 19200]
-
blk.57.ffn_up.weightQ4_0[7168 19200]
-
blk.57.ffn_down.weightQ4_0[19200 7168]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.58.attn_q.weightQ4_0[7168 7168]
-
blk.58.attn_k.weightQ4_0[7168 1024]
-
blk.58.attn_v.weightQ4_0[7168 1024]
-
blk.58.attn_output.weightQ4_0[7168 7168]
-
blk.58.ffn_gate.weightQ4_0[7168 19200]
-
blk.58.ffn_up.weightQ4_0[7168 19200]
-
blk.58.ffn_down.weightQ4_0[19200 7168]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.59.attn_q.weightQ4_0[7168 7168]
-
blk.59.attn_k.weightQ4_0[7168 1024]
-
blk.59.attn_v.weightQ4_0[7168 1024]
-
blk.59.attn_output.weightQ4_0[7168 7168]
-
blk.59.ffn_gate.weightQ4_0[7168 19200]
-
blk.59.ffn_up.weightQ4_0[7168 19200]
-
blk.59.ffn_down.weightQ4_0[19200 7168]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_norm.weightF32[7168]
-
blk.60.attn_q.weightQ4_0[7168 7168]
-
blk.60.attn_k.weightQ4_0[7168 1024]
-
blk.60.attn_v.weightQ4_0[7168 1024]
-
blk.60.attn_output.weightQ4_0[7168 7168]
-
blk.60.ffn_gate.weightQ4_0[7168 19200]
-
blk.60.ffn_up.weightQ4_0[7168 19200]
-
blk.60.ffn_down.weightQ4_0[19200 7168]
-
blk.60.attn_norm.weightF32[7168]
-
blk.60.ffn_norm.weightF32[7168]
-
blk.61.attn_q.weightQ4_0[7168 7168]
-
blk.61.attn_k.weightQ4_0[7168 1024]
-
blk.61.attn_v.weightQ4_0[7168 1024]
-
blk.61.attn_output.weightQ4_0[7168 7168]
-
blk.61.ffn_gate.weightQ4_0[7168 19200]
-
blk.61.ffn_up.weightQ4_0[7168 19200]
-
blk.61.ffn_down.weightQ4_0[19200 7168]
-
blk.61.attn_norm.weightF32[7168]
-
blk.61.ffn_norm.weightF32[7168]
-
output_norm.weightF32[7168]
-
output.weightQ6_K[7168 32256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61