latest
80GB
8x22B
Updated 2 months ago
cfcf93119280 · 80GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count48
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count56
-
llama.context_length65536
-
llama.embedding_length6144
-
llama.expert_count8
-
llama.expert_used_count2
-
llama.feed_forward_length16384
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32000
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
NameTypeShape
-
token_embd.weightQ4_0[6144 32000]
-
blk.0.ffn_gate_inp.weightF16[6144 8]
-
blk.0.attn_k.weightQ8_0[6144 1024]
-
blk.0.attn_output.weightQ4_0[6144 6144]
-
blk.0.attn_q.weightQ4_0[6144 6144]
-
blk.0.attn_v.weightQ8_0[6144 1024]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.0.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.0.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.1.ffn_gate_inp.weightF16[6144 8]
-
blk.1.attn_k.weightQ8_0[6144 1024]
-
blk.1.attn_output.weightQ4_0[6144 6144]
-
blk.1.attn_q.weightQ4_0[6144 6144]
-
blk.1.attn_v.weightQ8_0[6144 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.1.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.1.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.2.ffn_gate_inp.weightF16[6144 8]
-
blk.2.attn_k.weightQ8_0[6144 1024]
-
blk.2.attn_output.weightQ4_0[6144 6144]
-
blk.2.attn_q.weightQ4_0[6144 6144]
-
blk.2.attn_v.weightQ8_0[6144 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.2.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.2.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.3.ffn_gate_inp.weightF16[6144 8]
-
blk.3.attn_k.weightQ8_0[6144 1024]
-
blk.3.attn_output.weightQ4_0[6144 6144]
-
blk.3.attn_q.weightQ4_0[6144 6144]
-
blk.3.attn_v.weightQ8_0[6144 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.3.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.3.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.4.ffn_gate_inp.weightF16[6144 8]
-
blk.4.attn_k.weightQ8_0[6144 1024]
-
blk.4.attn_output.weightQ4_0[6144 6144]
-
blk.4.attn_q.weightQ4_0[6144 6144]
-
blk.4.attn_v.weightQ8_0[6144 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.4.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.4.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.5.ffn_gate_inp.weightF16[6144 8]
-
blk.5.attn_k.weightQ8_0[6144 1024]
-
blk.5.attn_output.weightQ4_0[6144 6144]
-
blk.5.attn_q.weightQ4_0[6144 6144]
-
blk.5.attn_v.weightQ8_0[6144 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.5.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.5.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.5.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.6.ffn_gate_inp.weightF16[6144 8]
-
blk.6.attn_k.weightQ8_0[6144 1024]
-
blk.6.attn_output.weightQ4_0[6144 6144]
-
blk.6.attn_q.weightQ4_0[6144 6144]
-
blk.6.attn_v.weightQ8_0[6144 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.6.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.6.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.7.ffn_gate_inp.weightF16[6144 8]
-
blk.7.attn_k.weightQ8_0[6144 1024]
-
blk.7.attn_output.weightQ4_0[6144 6144]
-
blk.7.attn_q.weightQ4_0[6144 6144]
-
blk.7.attn_v.weightQ8_0[6144 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.7.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.7.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.8.ffn_gate_inp.weightF16[6144 8]
-
blk.8.attn_k.weightQ8_0[6144 1024]
-
blk.8.attn_output.weightQ4_0[6144 6144]
-
blk.8.attn_q.weightQ4_0[6144 6144]
-
blk.8.attn_v.weightQ8_0[6144 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.8.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.8.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.9.ffn_gate_inp.weightF16[6144 8]
-
blk.9.attn_k.weightQ8_0[6144 1024]
-
blk.9.attn_output.weightQ4_0[6144 6144]
-
blk.9.attn_q.weightQ4_0[6144 6144]
-
blk.9.attn_v.weightQ8_0[6144 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.9.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.9.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.10.ffn_gate_inp.weightF16[6144 8]
-
blk.10.attn_k.weightQ8_0[6144 1024]
-
blk.10.attn_output.weightQ4_0[6144 6144]
-
blk.10.attn_q.weightQ4_0[6144 6144]
-
blk.10.attn_v.weightQ8_0[6144 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.10.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.10.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.11.ffn_gate_inp.weightF16[6144 8]
-
blk.11.attn_k.weightQ8_0[6144 1024]
-
blk.11.attn_output.weightQ4_0[6144 6144]
-
blk.11.attn_q.weightQ4_0[6144 6144]
-
blk.11.attn_v.weightQ8_0[6144 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.11.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.11.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.12.ffn_gate_inp.weightF16[6144 8]
-
blk.12.attn_k.weightQ8_0[6144 1024]
-
blk.12.attn_output.weightQ4_0[6144 6144]
-
blk.12.attn_q.weightQ4_0[6144 6144]
-
blk.12.attn_v.weightQ8_0[6144 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.12.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.12.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.13.ffn_gate_inp.weightF16[6144 8]
-
blk.13.attn_k.weightQ8_0[6144 1024]
-
blk.13.attn_output.weightQ4_0[6144 6144]
-
blk.13.attn_q.weightQ4_0[6144 6144]
-
blk.13.attn_v.weightQ8_0[6144 1024]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.13.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.13.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.14.ffn_gate_inp.weightF16[6144 8]
-
blk.14.attn_k.weightQ8_0[6144 1024]
-
blk.14.attn_output.weightQ4_0[6144 6144]
-
blk.14.attn_q.weightQ4_0[6144 6144]
-
blk.14.attn_v.weightQ8_0[6144 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.14.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.14.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.15.ffn_gate_inp.weightF16[6144 8]
-
blk.15.attn_k.weightQ8_0[6144 1024]
-
blk.15.attn_output.weightQ4_0[6144 6144]
-
blk.15.attn_q.weightQ4_0[6144 6144]
-
blk.15.attn_v.weightQ8_0[6144 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.15.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.15.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.16.ffn_gate_inp.weightF16[6144 8]
-
blk.16.attn_k.weightQ8_0[6144 1024]
-
blk.16.attn_output.weightQ4_0[6144 6144]
-
blk.16.attn_q.weightQ4_0[6144 6144]
-
blk.16.attn_v.weightQ8_0[6144 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.16.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.16.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.17.ffn_gate_inp.weightF16[6144 8]
-
blk.17.attn_k.weightQ8_0[6144 1024]
-
blk.17.attn_output.weightQ4_0[6144 6144]
-
blk.17.attn_q.weightQ4_0[6144 6144]
-
blk.17.attn_v.weightQ8_0[6144 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.17.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.17.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.18.ffn_gate_inp.weightF16[6144 8]
-
blk.18.attn_k.weightQ8_0[6144 1024]
-
blk.18.attn_output.weightQ4_0[6144 6144]
-
blk.18.attn_q.weightQ4_0[6144 6144]
-
blk.18.attn_v.weightQ8_0[6144 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.18.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.18.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.18.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.19.ffn_gate_inp.weightF16[6144 8]
-
blk.19.attn_k.weightQ8_0[6144 1024]
-
blk.19.attn_output.weightQ4_0[6144 6144]
-
blk.19.attn_q.weightQ4_0[6144 6144]
-
blk.19.attn_v.weightQ8_0[6144 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.19.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.19.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.20.ffn_gate_inp.weightF16[6144 8]
-
blk.20.attn_k.weightQ8_0[6144 1024]
-
blk.20.attn_output.weightQ4_0[6144 6144]
-
blk.20.attn_q.weightQ4_0[6144 6144]
-
blk.20.attn_v.weightQ8_0[6144 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.20.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.20.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.21.ffn_gate_inp.weightF16[6144 8]
-
blk.21.attn_k.weightQ8_0[6144 1024]
-
blk.21.attn_output.weightQ4_0[6144 6144]
-
blk.21.attn_q.weightQ4_0[6144 6144]
-
blk.21.attn_v.weightQ8_0[6144 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.21.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.21.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.22.ffn_gate_inp.weightF16[6144 8]
-
blk.22.attn_k.weightQ8_0[6144 1024]
-
blk.22.attn_output.weightQ4_0[6144 6144]
-
blk.22.attn_q.weightQ4_0[6144 6144]
-
blk.22.attn_v.weightQ8_0[6144 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.22.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.22.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.23.attn_k.weightQ8_0[6144 1024]
-
blk.23.attn_q.weightQ4_0[6144 6144]
-
blk.23.attn_v.weightQ8_0[6144 1024]
-
blk.23.ffn_gate_inp.weightF16[6144 8]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.attn_output.weightQ4_0[6144 6144]
-
blk.23.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.23.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.23.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.24.attn_k.weightQ8_0[6144 1024]
-
blk.24.attn_q.weightQ4_0[6144 6144]
-
blk.24.ffn_gate_inp.weightF16[6144 8]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.attn_output.weightQ4_0[6144 6144]
-
blk.24.attn_v.weightQ8_0[6144 1024]
-
blk.24.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.24.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.24.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.25.attn_q.weightQ4_0[6144 6144]
-
blk.25.ffn_gate_inp.weightF16[6144 8]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.attn_k.weightQ8_0[6144 1024]
-
blk.25.attn_output.weightQ4_0[6144 6144]
-
blk.25.attn_v.weightQ8_0[6144 1024]
-
blk.25.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.25.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.25.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.26.ffn_gate_inp.weightF16[6144 8]
-
blk.26.attn_k.weightQ8_0[6144 1024]
-
blk.26.attn_output.weightQ4_0[6144 6144]
-
blk.26.attn_q.weightQ4_0[6144 6144]
-
blk.26.attn_v.weightQ8_0[6144 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.26.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.26.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.27.ffn_gate_inp.weightF16[6144 8]
-
blk.27.attn_k.weightQ8_0[6144 1024]
-
blk.27.attn_output.weightQ4_0[6144 6144]
-
blk.27.attn_q.weightQ4_0[6144 6144]
-
blk.27.attn_v.weightQ8_0[6144 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.27.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.27.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.28.ffn_gate_inp.weightF16[6144 8]
-
blk.28.attn_k.weightQ8_0[6144 1024]
-
blk.28.attn_output.weightQ4_0[6144 6144]
-
blk.28.attn_q.weightQ4_0[6144 6144]
-
blk.28.attn_v.weightQ8_0[6144 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.28.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.28.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.29.ffn_gate_inp.weightF16[6144 8]
-
blk.29.attn_k.weightQ8_0[6144 1024]
-
blk.29.attn_output.weightQ4_0[6144 6144]
-
blk.29.attn_q.weightQ4_0[6144 6144]
-
blk.29.attn_v.weightQ8_0[6144 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.29.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.29.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.30.ffn_gate_inp.weightF16[6144 8]
-
blk.30.attn_k.weightQ8_0[6144 1024]
-
blk.30.attn_output.weightQ4_0[6144 6144]
-
blk.30.attn_q.weightQ4_0[6144 6144]
-
blk.30.attn_v.weightQ8_0[6144 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.30.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.30.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.31.ffn_gate_inp.weightF16[6144 8]
-
blk.31.attn_k.weightQ8_0[6144 1024]
-
blk.31.attn_output.weightQ4_0[6144 6144]
-
blk.31.attn_q.weightQ4_0[6144 6144]
-
blk.31.attn_v.weightQ8_0[6144 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.31.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.31.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.32.ffn_gate_inp.weightF16[6144 8]
-
blk.32.attn_k.weightQ8_0[6144 1024]
-
blk.32.attn_output.weightQ4_0[6144 6144]
-
blk.32.attn_q.weightQ4_0[6144 6144]
-
blk.32.attn_v.weightQ8_0[6144 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.32.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.32.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.33.ffn_gate_inp.weightF16[6144 8]
-
blk.33.attn_k.weightQ8_0[6144 1024]
-
blk.33.attn_output.weightQ4_0[6144 6144]
-
blk.33.attn_q.weightQ4_0[6144 6144]
-
blk.33.attn_v.weightQ8_0[6144 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.33.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.33.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.34.ffn_gate_inp.weightF16[6144 8]
-
blk.34.attn_k.weightQ8_0[6144 1024]
-
blk.34.attn_output.weightQ4_0[6144 6144]
-
blk.34.attn_q.weightQ4_0[6144 6144]
-
blk.34.attn_v.weightQ8_0[6144 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.34.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.34.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.35.ffn_gate_inp.weightF16[6144 8]
-
blk.35.attn_k.weightQ8_0[6144 1024]
-
blk.35.attn_output.weightQ4_0[6144 6144]
-
blk.35.attn_q.weightQ4_0[6144 6144]
-
blk.35.attn_v.weightQ8_0[6144 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.35.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.35.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.36.ffn_gate_inp.weightF16[6144 8]
-
blk.36.attn_k.weightQ8_0[6144 1024]
-
blk.36.attn_output.weightQ4_0[6144 6144]
-
blk.36.attn_q.weightQ4_0[6144 6144]
-
blk.36.attn_v.weightQ8_0[6144 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.36.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.36.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.37.ffn_gate_inp.weightF16[6144 8]
-
blk.37.attn_k.weightQ8_0[6144 1024]
-
blk.37.attn_output.weightQ4_0[6144 6144]
-
blk.37.attn_q.weightQ4_0[6144 6144]
-
blk.37.attn_v.weightQ8_0[6144 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.37.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.37.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.37.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.38.ffn_gate_inp.weightF16[6144 8]
-
blk.38.attn_k.weightQ8_0[6144 1024]
-
blk.38.attn_output.weightQ4_0[6144 6144]
-
blk.38.attn_q.weightQ4_0[6144 6144]
-
blk.38.attn_v.weightQ8_0[6144 1024]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.38.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.38.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.39.ffn_gate_inp.weightF16[6144 8]
-
blk.39.attn_k.weightQ8_0[6144 1024]
-
blk.39.attn_output.weightQ4_0[6144 6144]
-
blk.39.attn_q.weightQ4_0[6144 6144]
-
blk.39.attn_v.weightQ8_0[6144 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.39.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.39.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.40.ffn_gate_inp.weightF16[6144 8]
-
blk.40.attn_k.weightQ8_0[6144 1024]
-
blk.40.attn_output.weightQ4_0[6144 6144]
-
blk.40.attn_q.weightQ4_0[6144 6144]
-
blk.40.attn_v.weightQ8_0[6144 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.40.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.40.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.41.ffn_gate_inp.weightF16[6144 8]
-
blk.41.attn_k.weightQ8_0[6144 1024]
-
blk.41.attn_output.weightQ4_0[6144 6144]
-
blk.41.attn_q.weightQ4_0[6144 6144]
-
blk.41.attn_v.weightQ8_0[6144 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.41.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.41.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.42.ffn_gate_inp.weightF16[6144 8]
-
blk.42.attn_k.weightQ8_0[6144 1024]
-
blk.42.attn_output.weightQ4_0[6144 6144]
-
blk.42.attn_q.weightQ4_0[6144 6144]
-
blk.42.attn_v.weightQ8_0[6144 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.42.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.42.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.43.ffn_gate_inp.weightF16[6144 8]
-
blk.43.attn_k.weightQ8_0[6144 1024]
-
blk.43.attn_output.weightQ4_0[6144 6144]
-
blk.43.attn_q.weightQ4_0[6144 6144]
-
blk.43.attn_v.weightQ8_0[6144 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.43.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.43.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.43.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.44.ffn_gate_inp.weightF16[6144 8]
-
blk.44.attn_k.weightQ8_0[6144 1024]
-
blk.44.attn_output.weightQ4_0[6144 6144]
-
blk.44.attn_q.weightQ4_0[6144 6144]
-
blk.44.attn_v.weightQ8_0[6144 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.44.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.44.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.45.ffn_gate_inp.weightF16[6144 8]
-
blk.45.attn_k.weightQ8_0[6144 1024]
-
blk.45.attn_output.weightQ4_0[6144 6144]
-
blk.45.attn_q.weightQ4_0[6144 6144]
-
blk.45.attn_v.weightQ8_0[6144 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.45.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.45.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.46.ffn_gate_inp.weightF16[6144 8]
-
blk.46.attn_k.weightQ8_0[6144 1024]
-
blk.46.attn_output.weightQ4_0[6144 6144]
-
blk.46.attn_q.weightQ4_0[6144 6144]
-
blk.46.attn_v.weightQ8_0[6144 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.46.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.46.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.47.ffn_gate_inp.weightF16[6144 8]
-
blk.47.attn_k.weightQ8_0[6144 1024]
-
blk.47.attn_output.weightQ4_0[6144 6144]
-
blk.47.attn_q.weightQ4_0[6144 6144]
-
blk.47.attn_v.weightQ8_0[6144 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.47.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.47.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.48.ffn_gate_inp.weightF16[6144 8]
-
blk.48.attn_k.weightQ8_0[6144 1024]
-
blk.48.attn_output.weightQ4_0[6144 6144]
-
blk.48.attn_q.weightQ4_0[6144 6144]
-
blk.48.attn_v.weightQ8_0[6144 1024]
-
blk.48.attn_norm.weightF32[6144]
-
blk.48.ffn_norm.weightF32[6144]
-
blk.48.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.48.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.48.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.49.ffn_gate_inp.weightF16[6144 8]
-
blk.49.attn_k.weightQ8_0[6144 1024]
-
blk.49.attn_output.weightQ4_0[6144 6144]
-
blk.49.attn_q.weightQ4_0[6144 6144]
-
blk.49.attn_v.weightQ8_0[6144 1024]
-
blk.49.attn_norm.weightF32[6144]
-
blk.49.ffn_norm.weightF32[6144]
-
blk.49.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.49.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.49.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.50.attn_k.weightQ8_0[6144 1024]
-
blk.50.attn_q.weightQ4_0[6144 6144]
-
blk.50.attn_v.weightQ8_0[6144 1024]
-
blk.50.ffn_gate_inp.weightF16[6144 8]
-
blk.50.attn_norm.weightF32[6144]
-
blk.50.ffn_norm.weightF32[6144]
-
blk.50.attn_output.weightQ4_0[6144 6144]
-
blk.50.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.50.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.50.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.51.attn_k.weightQ8_0[6144 1024]
-
blk.51.attn_q.weightQ4_0[6144 6144]
-
blk.51.ffn_gate_inp.weightF16[6144 8]
-
blk.51.attn_norm.weightF32[6144]
-
blk.51.ffn_norm.weightF32[6144]
-
blk.51.attn_output.weightQ4_0[6144 6144]
-
blk.51.attn_v.weightQ8_0[6144 1024]
-
blk.51.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.51.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.51.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.52.attn_q.weightQ4_0[6144 6144]
-
blk.52.ffn_gate_inp.weightF16[6144 8]
-
blk.52.attn_norm.weightF32[6144]
-
blk.52.ffn_norm.weightF32[6144]
-
blk.52.attn_k.weightQ8_0[6144 1024]
-
blk.52.attn_output.weightQ4_0[6144 6144]
-
blk.52.attn_v.weightQ8_0[6144 1024]
-
blk.52.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.52.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.52.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.53.ffn_gate_inp.weightF16[6144 8]
-
blk.53.attn_k.weightQ8_0[6144 1024]
-
blk.53.attn_output.weightQ4_0[6144 6144]
-
blk.53.attn_q.weightQ4_0[6144 6144]
-
blk.53.attn_v.weightQ8_0[6144 1024]
-
blk.53.attn_norm.weightF32[6144]
-
blk.53.ffn_norm.weightF32[6144]
-
blk.53.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.53.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.53.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.54.ffn_gate_inp.weightF16[6144 8]
-
blk.54.attn_k.weightQ8_0[6144 1024]
-
blk.54.attn_output.weightQ4_0[6144 6144]
-
blk.54.attn_q.weightQ4_0[6144 6144]
-
blk.54.attn_v.weightQ8_0[6144 1024]
-
blk.54.attn_norm.weightF32[6144]
-
blk.54.ffn_norm.weightF32[6144]
-
blk.54.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.54.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.54.ffn_up_exps.weightQ4_0[6144 16384 8]
-
blk.55.ffn_gate_inp.weightF16[6144 8]
-
blk.55.attn_k.weightQ8_0[6144 1024]
-
blk.55.attn_output.weightQ4_0[6144 6144]
-
blk.55.attn_q.weightQ4_0[6144 6144]
-
blk.55.attn_v.weightQ8_0[6144 1024]
-
blk.55.attn_norm.weightF32[6144]
-
blk.55.ffn_norm.weightF32[6144]
-
blk.55.ffn_gate_exps.weightQ4_0[6144 16384 8]
-
blk.55.ffn_down_exps.weightQ4_0[16384 6144 8]
-
blk.55.ffn_up_exps.weightQ4_0[6144 16384 8]
-
output.weightQ6_K[6144 32000]
-
output_norm.weightF32[6144]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55