latest
21GB
SUS-Chat-34B is a 34B bilingual Chinese-English dialogue model, jointly released by the Southern University of Science and Technology and IDEA-CCNL.
34B
65 Pulls Updated 9 months ago
2b4c9e915a81 · 21GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count60
-
llama.context_length8192
-
llama.embedding_length7168
-
llama.feed_forward_length20480
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <|Human|> <|Assistant|> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[7168 64000]
-
blk.0.attn_q.weightQ4_K[7168 7168]
-
blk.0.attn_k.weightQ4_K[7168 1024]
-
blk.0.attn_v.weightQ6_K[7168 1024]
-
blk.0.attn_output.weightQ4_K[7168 7168]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.0.ffn_gate.weightQ4_K[7168 20480]
-
blk.0.ffn_up.weightQ4_K[7168 20480]
-
blk.0.ffn_down.weightQ6_K[20480 7168]
-
blk.1.attn_q.weightQ4_K[7168 7168]
-
blk.1.attn_k.weightQ4_K[7168 1024]
-
blk.1.attn_v.weightQ6_K[7168 1024]
-
blk.1.attn_output.weightQ4_K[7168 7168]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.1.ffn_gate.weightQ4_K[7168 20480]
-
blk.1.ffn_up.weightQ4_K[7168 20480]
-
blk.1.ffn_down.weightQ6_K[20480 7168]
-
blk.2.attn_q.weightQ4_K[7168 7168]
-
blk.2.attn_k.weightQ4_K[7168 1024]
-
blk.2.attn_v.weightQ6_K[7168 1024]
-
blk.2.attn_output.weightQ4_K[7168 7168]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.2.ffn_gate.weightQ4_K[7168 20480]
-
blk.2.ffn_up.weightQ4_K[7168 20480]
-
blk.2.ffn_down.weightQ6_K[20480 7168]
-
blk.3.attn_q.weightQ4_K[7168 7168]
-
blk.3.attn_k.weightQ4_K[7168 1024]
-
blk.3.attn_v.weightQ6_K[7168 1024]
-
blk.3.attn_output.weightQ4_K[7168 7168]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.3.ffn_gate.weightQ4_K[7168 20480]
-
blk.3.ffn_up.weightQ4_K[7168 20480]
-
blk.3.ffn_down.weightQ6_K[20480 7168]
-
blk.4.attn_q.weightQ4_K[7168 7168]
-
blk.4.attn_k.weightQ4_K[7168 1024]
-
blk.4.attn_v.weightQ6_K[7168 1024]
-
blk.4.attn_output.weightQ4_K[7168 7168]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.4.ffn_gate.weightQ4_K[7168 20480]
-
blk.4.ffn_up.weightQ4_K[7168 20480]
-
blk.4.ffn_down.weightQ6_K[20480 7168]
-
blk.5.attn_q.weightQ4_K[7168 7168]
-
blk.5.attn_k.weightQ4_K[7168 1024]
-
blk.5.attn_v.weightQ6_K[7168 1024]
-
blk.5.attn_output.weightQ4_K[7168 7168]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.5.ffn_gate.weightQ4_K[7168 20480]
-
blk.5.ffn_up.weightQ4_K[7168 20480]
-
blk.5.ffn_down.weightQ6_K[20480 7168]
-
blk.6.attn_q.weightQ4_K[7168 7168]
-
blk.6.attn_k.weightQ4_K[7168 1024]
-
blk.6.attn_v.weightQ6_K[7168 1024]
-
blk.6.attn_output.weightQ4_K[7168 7168]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.6.ffn_gate.weightQ4_K[7168 20480]
-
blk.6.ffn_up.weightQ4_K[7168 20480]
-
blk.6.ffn_down.weightQ6_K[20480 7168]
-
blk.7.attn_q.weightQ4_K[7168 7168]
-
blk.7.attn_k.weightQ4_K[7168 1024]
-
blk.7.attn_v.weightQ4_K[7168 1024]
-
blk.7.attn_output.weightQ4_K[7168 7168]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.7.ffn_gate.weightQ4_K[7168 20480]
-
blk.7.ffn_up.weightQ4_K[7168 20480]
-
blk.7.ffn_down.weightQ4_K[20480 7168]
-
blk.8.attn_q.weightQ4_K[7168 7168]
-
blk.8.attn_k.weightQ4_K[7168 1024]
-
blk.8.attn_v.weightQ4_K[7168 1024]
-
blk.8.attn_output.weightQ4_K[7168 7168]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.8.ffn_gate.weightQ4_K[7168 20480]
-
blk.8.ffn_up.weightQ4_K[7168 20480]
-
blk.8.ffn_down.weightQ4_K[20480 7168]
-
blk.9.attn_q.weightQ4_K[7168 7168]
-
blk.9.attn_k.weightQ4_K[7168 1024]
-
blk.9.attn_v.weightQ6_K[7168 1024]
-
blk.9.attn_output.weightQ4_K[7168 7168]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.9.ffn_gate.weightQ4_K[7168 20480]
-
blk.9.ffn_up.weightQ4_K[7168 20480]
-
blk.9.ffn_down.weightQ6_K[20480 7168]
-
blk.10.attn_q.weightQ4_K[7168 7168]
-
blk.10.attn_k.weightQ4_K[7168 1024]
-
blk.10.attn_v.weightQ4_K[7168 1024]
-
blk.10.attn_output.weightQ4_K[7168 7168]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.10.ffn_gate.weightQ4_K[7168 20480]
-
blk.10.ffn_up.weightQ4_K[7168 20480]
-
blk.10.ffn_down.weightQ4_K[20480 7168]
-
blk.11.attn_q.weightQ4_K[7168 7168]
-
blk.11.attn_k.weightQ4_K[7168 1024]
-
blk.11.attn_v.weightQ4_K[7168 1024]
-
blk.11.attn_output.weightQ4_K[7168 7168]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.11.ffn_gate.weightQ4_K[7168 20480]
-
blk.11.ffn_up.weightQ4_K[7168 20480]
-
blk.11.ffn_down.weightQ4_K[20480 7168]
-
blk.12.attn_q.weightQ4_K[7168 7168]
-
blk.12.attn_k.weightQ4_K[7168 1024]
-
blk.12.attn_v.weightQ6_K[7168 1024]
-
blk.12.attn_output.weightQ4_K[7168 7168]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.12.ffn_gate.weightQ4_K[7168 20480]
-
blk.12.ffn_up.weightQ4_K[7168 20480]
-
blk.12.ffn_down.weightQ6_K[20480 7168]
-
blk.13.attn_q.weightQ4_K[7168 7168]
-
blk.13.attn_k.weightQ4_K[7168 1024]
-
blk.13.attn_v.weightQ4_K[7168 1024]
-
blk.13.attn_output.weightQ4_K[7168 7168]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.13.ffn_gate.weightQ4_K[7168 20480]
-
blk.13.ffn_up.weightQ4_K[7168 20480]
-
blk.13.ffn_down.weightQ4_K[20480 7168]
-
blk.14.attn_q.weightQ4_K[7168 7168]
-
blk.14.attn_k.weightQ4_K[7168 1024]
-
blk.14.attn_v.weightQ4_K[7168 1024]
-
blk.14.attn_output.weightQ4_K[7168 7168]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.14.ffn_gate.weightQ4_K[7168 20480]
-
blk.14.ffn_up.weightQ4_K[7168 20480]
-
blk.14.ffn_down.weightQ4_K[20480 7168]
-
blk.15.attn_q.weightQ4_K[7168 7168]
-
blk.15.attn_k.weightQ4_K[7168 1024]
-
blk.15.attn_v.weightQ6_K[7168 1024]
-
blk.15.attn_output.weightQ4_K[7168 7168]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.15.ffn_gate.weightQ4_K[7168 20480]
-
blk.15.ffn_up.weightQ4_K[7168 20480]
-
blk.15.ffn_down.weightQ6_K[20480 7168]
-
blk.16.attn_q.weightQ4_K[7168 7168]
-
blk.16.attn_k.weightQ4_K[7168 1024]
-
blk.16.attn_v.weightQ4_K[7168 1024]
-
blk.16.attn_output.weightQ4_K[7168 7168]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.16.ffn_gate.weightQ4_K[7168 20480]
-
blk.16.ffn_up.weightQ4_K[7168 20480]
-
blk.16.ffn_down.weightQ4_K[20480 7168]
-
blk.17.attn_q.weightQ4_K[7168 7168]
-
blk.17.attn_k.weightQ4_K[7168 1024]
-
blk.17.attn_v.weightQ4_K[7168 1024]
-
blk.17.attn_output.weightQ4_K[7168 7168]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.17.ffn_gate.weightQ4_K[7168 20480]
-
blk.17.ffn_up.weightQ4_K[7168 20480]
-
blk.17.ffn_down.weightQ4_K[20480 7168]
-
blk.18.attn_q.weightQ4_K[7168 7168]
-
blk.18.attn_k.weightQ4_K[7168 1024]
-
blk.18.attn_v.weightQ6_K[7168 1024]
-
blk.18.attn_output.weightQ4_K[7168 7168]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.18.ffn_gate.weightQ4_K[7168 20480]
-
blk.18.ffn_up.weightQ4_K[7168 20480]
-
blk.18.ffn_down.weightQ6_K[20480 7168]
-
blk.19.attn_q.weightQ4_K[7168 7168]
-
blk.19.attn_k.weightQ4_K[7168 1024]
-
blk.19.attn_v.weightQ4_K[7168 1024]
-
blk.19.attn_output.weightQ4_K[7168 7168]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.19.ffn_gate.weightQ4_K[7168 20480]
-
blk.19.ffn_up.weightQ4_K[7168 20480]
-
blk.19.ffn_down.weightQ4_K[20480 7168]
-
blk.20.attn_q.weightQ4_K[7168 7168]
-
blk.20.attn_k.weightQ4_K[7168 1024]
-
blk.20.attn_v.weightQ4_K[7168 1024]
-
blk.20.attn_output.weightQ4_K[7168 7168]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.20.ffn_gate.weightQ4_K[7168 20480]
-
blk.20.ffn_up.weightQ4_K[7168 20480]
-
blk.20.ffn_down.weightQ4_K[20480 7168]
-
blk.21.attn_q.weightQ4_K[7168 7168]
-
blk.21.attn_k.weightQ4_K[7168 1024]
-
blk.21.attn_v.weightQ6_K[7168 1024]
-
blk.21.attn_output.weightQ4_K[7168 7168]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.21.ffn_gate.weightQ4_K[7168 20480]
-
blk.21.ffn_up.weightQ4_K[7168 20480]
-
blk.21.ffn_down.weightQ6_K[20480 7168]
-
blk.22.attn_q.weightQ4_K[7168 7168]
-
blk.22.attn_k.weightQ4_K[7168 1024]
-
blk.22.attn_v.weightQ4_K[7168 1024]
-
blk.22.attn_output.weightQ4_K[7168 7168]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.22.ffn_gate.weightQ4_K[7168 20480]
-
blk.22.ffn_up.weightQ4_K[7168 20480]
-
blk.22.ffn_down.weightQ4_K[20480 7168]
-
blk.23.attn_q.weightQ4_K[7168 7168]
-
blk.23.attn_k.weightQ4_K[7168 1024]
-
blk.23.attn_v.weightQ4_K[7168 1024]
-
blk.23.attn_output.weightQ4_K[7168 7168]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.23.ffn_gate.weightQ4_K[7168 20480]
-
blk.23.ffn_up.weightQ4_K[7168 20480]
-
blk.23.ffn_down.weightQ4_K[20480 7168]
-
blk.24.attn_q.weightQ4_K[7168 7168]
-
blk.24.attn_k.weightQ4_K[7168 1024]
-
blk.24.attn_v.weightQ6_K[7168 1024]
-
blk.24.attn_output.weightQ4_K[7168 7168]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.24.ffn_gate.weightQ4_K[7168 20480]
-
blk.24.ffn_up.weightQ4_K[7168 20480]
-
blk.24.ffn_down.weightQ6_K[20480 7168]
-
blk.25.attn_q.weightQ4_K[7168 7168]
-
blk.25.attn_k.weightQ4_K[7168 1024]
-
blk.25.attn_v.weightQ4_K[7168 1024]
-
blk.25.attn_output.weightQ4_K[7168 7168]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.25.ffn_gate.weightQ4_K[7168 20480]
-
blk.25.ffn_up.weightQ4_K[7168 20480]
-
blk.25.ffn_down.weightQ4_K[20480 7168]
-
blk.26.attn_q.weightQ4_K[7168 7168]
-
blk.26.attn_k.weightQ4_K[7168 1024]
-
blk.26.attn_v.weightQ4_K[7168 1024]
-
blk.26.attn_output.weightQ4_K[7168 7168]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.26.ffn_gate.weightQ4_K[7168 20480]
-
blk.26.ffn_up.weightQ4_K[7168 20480]
-
blk.26.ffn_down.weightQ4_K[20480 7168]
-
blk.27.attn_q.weightQ4_K[7168 7168]
-
blk.27.attn_k.weightQ4_K[7168 1024]
-
blk.27.attn_v.weightQ6_K[7168 1024]
-
blk.27.attn_output.weightQ4_K[7168 7168]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.27.ffn_gate.weightQ4_K[7168 20480]
-
blk.27.ffn_up.weightQ4_K[7168 20480]
-
blk.27.ffn_down.weightQ6_K[20480 7168]
-
blk.28.attn_q.weightQ4_K[7168 7168]
-
blk.28.attn_k.weightQ4_K[7168 1024]
-
blk.28.attn_v.weightQ4_K[7168 1024]
-
blk.28.attn_output.weightQ4_K[7168 7168]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.28.ffn_gate.weightQ4_K[7168 20480]
-
blk.28.ffn_up.weightQ4_K[7168 20480]
-
blk.28.ffn_down.weightQ4_K[20480 7168]
-
blk.29.attn_q.weightQ4_K[7168 7168]
-
blk.29.attn_k.weightQ4_K[7168 1024]
-
blk.29.attn_v.weightQ4_K[7168 1024]
-
blk.29.attn_output.weightQ4_K[7168 7168]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.29.ffn_gate.weightQ4_K[7168 20480]
-
blk.29.ffn_up.weightQ4_K[7168 20480]
-
blk.29.ffn_down.weightQ4_K[20480 7168]
-
blk.30.attn_q.weightQ4_K[7168 7168]
-
blk.30.attn_k.weightQ4_K[7168 1024]
-
blk.30.attn_v.weightQ6_K[7168 1024]
-
blk.30.attn_output.weightQ4_K[7168 7168]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.30.ffn_gate.weightQ4_K[7168 20480]
-
blk.30.ffn_up.weightQ4_K[7168 20480]
-
blk.30.ffn_down.weightQ6_K[20480 7168]
-
blk.31.attn_q.weightQ4_K[7168 7168]
-
blk.31.attn_k.weightQ4_K[7168 1024]
-
blk.31.attn_v.weightQ4_K[7168 1024]
-
blk.31.attn_output.weightQ4_K[7168 7168]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.31.ffn_gate.weightQ4_K[7168 20480]
-
blk.31.ffn_up.weightQ4_K[7168 20480]
-
blk.31.ffn_down.weightQ4_K[20480 7168]
-
blk.32.attn_q.weightQ4_K[7168 7168]
-
blk.32.attn_k.weightQ4_K[7168 1024]
-
blk.32.attn_v.weightQ4_K[7168 1024]
-
blk.32.attn_output.weightQ4_K[7168 7168]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.32.ffn_gate.weightQ4_K[7168 20480]
-
blk.32.ffn_up.weightQ4_K[7168 20480]
-
blk.32.ffn_down.weightQ4_K[20480 7168]
-
blk.33.attn_q.weightQ4_K[7168 7168]
-
blk.33.attn_k.weightQ4_K[7168 1024]
-
blk.33.attn_v.weightQ6_K[7168 1024]
-
blk.33.attn_output.weightQ4_K[7168 7168]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.33.ffn_gate.weightQ4_K[7168 20480]
-
blk.33.ffn_up.weightQ4_K[7168 20480]
-
blk.33.ffn_down.weightQ6_K[20480 7168]
-
blk.34.attn_q.weightQ4_K[7168 7168]
-
blk.34.attn_k.weightQ4_K[7168 1024]
-
blk.34.attn_v.weightQ4_K[7168 1024]
-
blk.34.attn_output.weightQ4_K[7168 7168]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.34.ffn_gate.weightQ4_K[7168 20480]
-
blk.34.ffn_up.weightQ4_K[7168 20480]
-
blk.34.ffn_down.weightQ4_K[20480 7168]
-
blk.35.attn_q.weightQ4_K[7168 7168]
-
blk.35.attn_k.weightQ4_K[7168 1024]
-
blk.35.attn_v.weightQ4_K[7168 1024]
-
blk.35.attn_output.weightQ4_K[7168 7168]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.35.ffn_gate.weightQ4_K[7168 20480]
-
blk.35.ffn_up.weightQ4_K[7168 20480]
-
blk.35.ffn_down.weightQ4_K[20480 7168]
-
blk.36.attn_q.weightQ4_K[7168 7168]
-
blk.36.attn_k.weightQ4_K[7168 1024]
-
blk.36.attn_v.weightQ6_K[7168 1024]
-
blk.36.attn_output.weightQ4_K[7168 7168]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.36.ffn_gate.weightQ4_K[7168 20480]
-
blk.36.ffn_up.weightQ4_K[7168 20480]
-
blk.36.ffn_down.weightQ6_K[20480 7168]
-
blk.37.attn_q.weightQ4_K[7168 7168]
-
blk.37.attn_k.weightQ4_K[7168 1024]
-
blk.37.attn_v.weightQ4_K[7168 1024]
-
blk.37.attn_output.weightQ4_K[7168 7168]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.37.ffn_gate.weightQ4_K[7168 20480]
-
blk.37.ffn_up.weightQ4_K[7168 20480]
-
blk.37.ffn_down.weightQ4_K[20480 7168]
-
blk.38.attn_q.weightQ4_K[7168 7168]
-
blk.38.attn_k.weightQ4_K[7168 1024]
-
blk.38.attn_v.weightQ4_K[7168 1024]
-
blk.38.attn_output.weightQ4_K[7168 7168]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.38.ffn_gate.weightQ4_K[7168 20480]
-
blk.38.ffn_up.weightQ4_K[7168 20480]
-
blk.38.ffn_down.weightQ4_K[20480 7168]
-
blk.39.attn_q.weightQ4_K[7168 7168]
-
blk.39.attn_k.weightQ4_K[7168 1024]
-
blk.39.attn_v.weightQ6_K[7168 1024]
-
blk.39.attn_output.weightQ4_K[7168 7168]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.39.ffn_gate.weightQ4_K[7168 20480]
-
blk.39.ffn_up.weightQ4_K[7168 20480]
-
blk.39.ffn_down.weightQ6_K[20480 7168]
-
blk.40.attn_q.weightQ4_K[7168 7168]
-
blk.40.attn_k.weightQ4_K[7168 1024]
-
blk.40.attn_v.weightQ4_K[7168 1024]
-
blk.40.attn_output.weightQ4_K[7168 7168]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.40.ffn_gate.weightQ4_K[7168 20480]
-
blk.40.ffn_up.weightQ4_K[7168 20480]
-
blk.40.ffn_down.weightQ4_K[20480 7168]
-
blk.41.attn_q.weightQ4_K[7168 7168]
-
blk.41.attn_k.weightQ4_K[7168 1024]
-
blk.41.attn_v.weightQ4_K[7168 1024]
-
blk.41.attn_output.weightQ4_K[7168 7168]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.41.ffn_gate.weightQ4_K[7168 20480]
-
blk.41.ffn_up.weightQ4_K[7168 20480]
-
blk.41.ffn_down.weightQ4_K[20480 7168]
-
blk.42.attn_q.weightQ4_K[7168 7168]
-
blk.42.attn_k.weightQ4_K[7168 1024]
-
blk.42.attn_v.weightQ6_K[7168 1024]
-
blk.42.attn_output.weightQ4_K[7168 7168]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.42.ffn_gate.weightQ4_K[7168 20480]
-
blk.42.ffn_up.weightQ4_K[7168 20480]
-
blk.42.ffn_down.weightQ6_K[20480 7168]
-
blk.43.attn_q.weightQ4_K[7168 7168]
-
blk.43.attn_k.weightQ4_K[7168 1024]
-
blk.43.attn_v.weightQ4_K[7168 1024]
-
blk.43.attn_output.weightQ4_K[7168 7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.43.ffn_gate.weightQ4_K[7168 20480]
-
blk.43.ffn_up.weightQ4_K[7168 20480]
-
blk.43.ffn_down.weightQ4_K[20480 7168]
-
blk.44.attn_q.weightQ4_K[7168 7168]
-
blk.44.attn_k.weightQ4_K[7168 1024]
-
blk.44.attn_v.weightQ4_K[7168 1024]
-
blk.44.attn_output.weightQ4_K[7168 7168]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.44.ffn_gate.weightQ4_K[7168 20480]
-
blk.44.ffn_up.weightQ4_K[7168 20480]
-
blk.44.ffn_down.weightQ4_K[20480 7168]
-
blk.45.attn_q.weightQ4_K[7168 7168]
-
blk.45.attn_k.weightQ4_K[7168 1024]
-
blk.45.attn_v.weightQ6_K[7168 1024]
-
blk.45.attn_output.weightQ4_K[7168 7168]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.45.ffn_gate.weightQ4_K[7168 20480]
-
blk.45.ffn_up.weightQ4_K[7168 20480]
-
blk.45.ffn_down.weightQ6_K[20480 7168]
-
blk.46.attn_q.weightQ4_K[7168 7168]
-
blk.46.attn_k.weightQ4_K[7168 1024]
-
blk.46.attn_v.weightQ4_K[7168 1024]
-
blk.46.attn_output.weightQ4_K[7168 7168]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.46.ffn_gate.weightQ4_K[7168 20480]
-
blk.46.ffn_up.weightQ4_K[7168 20480]
-
blk.46.ffn_down.weightQ4_K[20480 7168]
-
blk.47.attn_q.weightQ4_K[7168 7168]
-
blk.47.attn_k.weightQ4_K[7168 1024]
-
blk.47.attn_v.weightQ4_K[7168 1024]
-
blk.47.attn_output.weightQ4_K[7168 7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.47.ffn_gate.weightQ4_K[7168 20480]
-
blk.47.ffn_up.weightQ4_K[7168 20480]
-
blk.47.ffn_down.weightQ4_K[20480 7168]
-
blk.48.attn_q.weightQ4_K[7168 7168]
-
blk.48.attn_k.weightQ4_K[7168 1024]
-
blk.48.attn_v.weightQ6_K[7168 1024]
-
blk.48.attn_output.weightQ4_K[7168 7168]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.48.ffn_gate.weightQ4_K[7168 20480]
-
blk.48.ffn_up.weightQ4_K[7168 20480]
-
blk.48.ffn_down.weightQ6_K[20480 7168]
-
blk.49.attn_q.weightQ4_K[7168 7168]
-
blk.49.attn_k.weightQ4_K[7168 1024]
-
blk.49.attn_v.weightQ4_K[7168 1024]
-
blk.49.attn_output.weightQ4_K[7168 7168]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.49.ffn_gate.weightQ4_K[7168 20480]
-
blk.49.ffn_up.weightQ4_K[7168 20480]
-
blk.49.ffn_down.weightQ4_K[20480 7168]
-
blk.50.attn_q.weightQ4_K[7168 7168]
-
blk.50.attn_k.weightQ4_K[7168 1024]
-
blk.50.attn_v.weightQ4_K[7168 1024]
-
blk.50.attn_output.weightQ4_K[7168 7168]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.50.ffn_gate.weightQ4_K[7168 20480]
-
blk.50.ffn_up.weightQ4_K[7168 20480]
-
blk.50.ffn_down.weightQ4_K[20480 7168]
-
blk.51.attn_q.weightQ4_K[7168 7168]
-
blk.51.attn_k.weightQ4_K[7168 1024]
-
blk.51.attn_v.weightQ6_K[7168 1024]
-
blk.51.attn_output.weightQ4_K[7168 7168]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.51.ffn_gate.weightQ4_K[7168 20480]
-
blk.51.ffn_up.weightQ4_K[7168 20480]
-
blk.51.ffn_down.weightQ6_K[20480 7168]
-
blk.52.attn_q.weightQ4_K[7168 7168]
-
blk.52.attn_k.weightQ4_K[7168 1024]
-
blk.52.attn_v.weightQ6_K[7168 1024]
-
blk.52.attn_output.weightQ4_K[7168 7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.52.ffn_gate.weightQ4_K[7168 20480]
-
blk.52.ffn_up.weightQ4_K[7168 20480]
-
blk.52.ffn_down.weightQ6_K[20480 7168]
-
blk.53.attn_q.weightQ4_K[7168 7168]
-
blk.53.attn_k.weightQ4_K[7168 1024]
-
blk.53.attn_v.weightQ6_K[7168 1024]
-
blk.53.attn_output.weightQ4_K[7168 7168]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.53.ffn_gate.weightQ4_K[7168 20480]
-
blk.53.ffn_up.weightQ4_K[7168 20480]
-
blk.53.ffn_down.weightQ6_K[20480 7168]
-
blk.54.attn_q.weightQ4_K[7168 7168]
-
blk.54.attn_k.weightQ4_K[7168 1024]
-
blk.54.attn_v.weightQ6_K[7168 1024]
-
blk.54.attn_output.weightQ4_K[7168 7168]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.54.ffn_gate.weightQ4_K[7168 20480]
-
blk.54.ffn_up.weightQ4_K[7168 20480]
-
blk.54.ffn_down.weightQ6_K[20480 7168]
-
blk.55.attn_q.weightQ4_K[7168 7168]
-
blk.55.attn_k.weightQ4_K[7168 1024]
-
blk.55.attn_v.weightQ6_K[7168 1024]
-
blk.55.attn_output.weightQ4_K[7168 7168]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.55.ffn_gate.weightQ4_K[7168 20480]
-
blk.55.ffn_up.weightQ4_K[7168 20480]
-
blk.55.ffn_down.weightQ6_K[20480 7168]
-
blk.56.attn_q.weightQ4_K[7168 7168]
-
blk.56.attn_k.weightQ4_K[7168 1024]
-
blk.56.attn_v.weightQ6_K[7168 1024]
-
blk.56.attn_output.weightQ4_K[7168 7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.56.ffn_gate.weightQ4_K[7168 20480]
-
blk.56.ffn_up.weightQ4_K[7168 20480]
-
blk.56.ffn_down.weightQ6_K[20480 7168]
-
blk.57.attn_q.weightQ4_K[7168 7168]
-
blk.57.attn_k.weightQ4_K[7168 1024]
-
blk.57.attn_v.weightQ6_K[7168 1024]
-
blk.57.attn_output.weightQ4_K[7168 7168]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.57.ffn_gate.weightQ4_K[7168 20480]
-
blk.57.ffn_up.weightQ4_K[7168 20480]
-
blk.57.ffn_down.weightQ6_K[20480 7168]
-
blk.58.attn_q.weightQ4_K[7168 7168]
-
blk.58.attn_k.weightQ4_K[7168 1024]
-
blk.58.attn_v.weightQ6_K[7168 1024]
-
blk.58.attn_output.weightQ4_K[7168 7168]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.58.ffn_gate.weightQ4_K[7168 20480]
-
blk.58.ffn_up.weightQ4_K[7168 20480]
-
blk.58.ffn_down.weightQ6_K[20480 7168]
-
blk.59.attn_q.weightQ4_K[7168 7168]
-
blk.59.attn_k.weightQ4_K[7168 1024]
-
blk.59.attn_v.weightQ6_K[7168 1024]
-
blk.59.attn_output.weightQ4_K[7168 7168]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_norm.weightF32[7168]
-
blk.59.ffn_gate.weightQ4_K[7168 20480]
-
blk.59.ffn_up.weightQ4_K[7168 20480]
-
blk.59.ffn_down.weightQ6_K[20480 7168]
-
output_norm.weightF32[7168]
-
output.weightQ6_K[7168 64000]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59