latest
9.6GB
The Nanbeige2-16B-Chat is the latest 16B model developed by the Nanbeige Lab, which utilized 4.5T tokens of high-quality training data during the training phase.
49 Pulls Updated 4 months ago
ade5006c7378 · 9.6GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count40
-
llama.attention.head_count_kv40
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count48
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length13824
-
llama.rope.dimension_count128
-
llama.vocab_size59392
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id58978
-
tokenizer.ggml.eos_token_id58979
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[5120 59392]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ6_K[13824 5120]
-
blk.0.ffn_gate.weightQ4_K[5120 13824]
-
blk.0.ffn_up.weightQ4_K[5120 13824]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weightQ4_K[5120 5120]
-
blk.0.attn_output.weightQ4_K[5120 5120]
-
blk.0.attn_q.weightQ4_K[5120 5120]
-
blk.0.attn_v.weightQ6_K[5120 5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ6_K[13824 5120]
-
blk.1.ffn_gate.weightQ4_K[5120 13824]
-
blk.1.ffn_up.weightQ4_K[5120 13824]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weightQ4_K[5120 5120]
-
blk.1.attn_output.weightQ4_K[5120 5120]
-
blk.1.attn_q.weightQ4_K[5120 5120]
-
blk.1.attn_v.weightQ6_K[5120 5120]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ6_K[13824 5120]
-
blk.2.ffn_gate.weightQ4_K[5120 13824]
-
blk.2.ffn_up.weightQ4_K[5120 13824]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weightQ4_K[5120 5120]
-
blk.2.attn_output.weightQ4_K[5120 5120]
-
blk.2.attn_q.weightQ4_K[5120 5120]
-
blk.2.attn_v.weightQ6_K[5120 5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ6_K[13824 5120]
-
blk.3.ffn_gate.weightQ4_K[5120 13824]
-
blk.3.ffn_up.weightQ4_K[5120 13824]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weightQ4_K[5120 5120]
-
blk.3.attn_output.weightQ4_K[5120 5120]
-
blk.3.attn_q.weightQ4_K[5120 5120]
-
blk.3.attn_v.weightQ6_K[5120 5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ6_K[13824 5120]
-
blk.4.ffn_gate.weightQ4_K[5120 13824]
-
blk.4.ffn_up.weightQ4_K[5120 13824]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weightQ4_K[5120 5120]
-
blk.4.attn_output.weightQ4_K[5120 5120]
-
blk.4.attn_q.weightQ4_K[5120 5120]
-
blk.4.attn_v.weightQ6_K[5120 5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ6_K[13824 5120]
-
blk.5.ffn_gate.weightQ4_K[5120 13824]
-
blk.5.ffn_up.weightQ4_K[5120 13824]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weightQ4_K[5120 5120]
-
blk.5.attn_output.weightQ4_K[5120 5120]
-
blk.5.attn_q.weightQ4_K[5120 5120]
-
blk.5.attn_v.weightQ6_K[5120 5120]
-
blk.6.ffn_gate.weightQ4_K[5120 13824]
-
blk.6.ffn_up.weightQ4_K[5120 13824]
-
blk.6.attn_k.weightQ4_K[5120 5120]
-
blk.6.attn_output.weightQ4_K[5120 5120]
-
blk.6.attn_q.weightQ4_K[5120 5120]
-
blk.6.attn_v.weightQ4_K[5120 5120]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ4_K[13824 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ6_K[13824 5120]
-
blk.7.ffn_gate.weightQ4_K[5120 13824]
-
blk.7.ffn_up.weightQ4_K[5120 13824]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weightQ4_K[5120 5120]
-
blk.7.attn_output.weightQ4_K[5120 5120]
-
blk.7.attn_q.weightQ4_K[5120 5120]
-
blk.7.attn_v.weightQ4_K[5120 5120]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ4_K[13824 5120]
-
blk.8.ffn_gate.weightQ4_K[5120 13824]
-
blk.8.ffn_up.weightQ4_K[5120 13824]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weightQ4_K[5120 5120]
-
blk.8.attn_output.weightQ4_K[5120 5120]
-
blk.8.attn_q.weightQ4_K[5120 5120]
-
blk.8.attn_v.weightQ4_K[5120 5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ4_K[13824 5120]
-
blk.9.ffn_gate.weightQ4_K[5120 13824]
-
blk.9.ffn_up.weightQ4_K[5120 13824]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weightQ4_K[5120 5120]
-
blk.9.attn_output.weightQ4_K[5120 5120]
-
blk.9.attn_q.weightQ4_K[5120 5120]
-
blk.9.attn_v.weightQ6_K[5120 5120]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ4_K[13824 5120]
-
blk.10.ffn_gate.weightQ4_K[5120 13824]
-
blk.10.ffn_up.weightQ4_K[5120 13824]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weightQ4_K[5120 5120]
-
blk.10.attn_output.weightQ4_K[5120 5120]
-
blk.10.attn_q.weightQ4_K[5120 5120]
-
blk.10.attn_v.weightQ4_K[5120 5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ4_K[13824 5120]
-
blk.11.ffn_gate.weightQ4_K[5120 13824]
-
blk.11.ffn_up.weightQ4_K[5120 13824]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weightQ4_K[5120 5120]
-
blk.11.attn_output.weightQ4_K[5120 5120]
-
blk.11.attn_q.weightQ4_K[5120 5120]
-
blk.11.attn_v.weightQ6_K[5120 5120]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ6_K[13824 5120]
-
blk.12.ffn_gate.weightQ4_K[5120 13824]
-
blk.12.ffn_up.weightQ4_K[5120 13824]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weightQ4_K[5120 5120]
-
blk.12.attn_output.weightQ4_K[5120 5120]
-
blk.12.attn_q.weightQ4_K[5120 5120]
-
blk.12.attn_v.weightQ4_K[5120 5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_K[13824 5120]
-
blk.13.ffn_gate.weightQ4_K[5120 13824]
-
blk.13.ffn_up.weightQ4_K[5120 13824]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weightQ4_K[5120 5120]
-
blk.13.attn_output.weightQ4_K[5120 5120]
-
blk.13.attn_q.weightQ4_K[5120 5120]
-
blk.13.attn_v.weightQ4_K[5120 5120]
-
blk.14.ffn_gate.weightQ4_K[5120 13824]
-
blk.14.attn_k.weightQ4_K[5120 5120]
-
blk.14.attn_output.weightQ4_K[5120 5120]
-
blk.14.attn_q.weightQ4_K[5120 5120]
-
blk.14.attn_v.weightQ6_K[5120 5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ6_K[13824 5120]
-
blk.14.ffn_up.weightQ4_K[5120 13824]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_K[13824 5120]
-
blk.15.ffn_gate.weightQ4_K[5120 13824]
-
blk.15.ffn_up.weightQ4_K[5120 13824]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.weightQ4_K[5120 5120]
-
blk.15.attn_output.weightQ4_K[5120 5120]
-
blk.15.attn_q.weightQ4_K[5120 5120]
-
blk.15.attn_v.weightQ4_K[5120 5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ4_K[13824 5120]
-
blk.16.ffn_gate.weightQ4_K[5120 13824]
-
blk.16.ffn_up.weightQ4_K[5120 13824]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weightQ4_K[5120 5120]
-
blk.16.attn_output.weightQ4_K[5120 5120]
-
blk.16.attn_q.weightQ4_K[5120 5120]
-
blk.16.attn_v.weightQ4_K[5120 5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ6_K[13824 5120]
-
blk.17.ffn_gate.weightQ4_K[5120 13824]
-
blk.17.ffn_up.weightQ4_K[5120 13824]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weightQ4_K[5120 5120]
-
blk.17.attn_output.weightQ4_K[5120 5120]
-
blk.17.attn_q.weightQ4_K[5120 5120]
-
blk.17.attn_v.weightQ6_K[5120 5120]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_K[13824 5120]
-
blk.18.ffn_gate.weightQ4_K[5120 13824]
-
blk.18.ffn_up.weightQ4_K[5120 13824]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weightQ4_K[5120 5120]
-
blk.18.attn_output.weightQ4_K[5120 5120]
-
blk.18.attn_q.weightQ4_K[5120 5120]
-
blk.18.attn_v.weightQ4_K[5120 5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ4_K[13824 5120]
-
blk.19.ffn_gate.weightQ4_K[5120 13824]
-
blk.19.ffn_up.weightQ4_K[5120 13824]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weightQ4_K[5120 5120]
-
blk.19.attn_output.weightQ4_K[5120 5120]
-
blk.19.attn_q.weightQ4_K[5120 5120]
-
blk.19.attn_v.weightQ4_K[5120 5120]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ6_K[13824 5120]
-
blk.20.ffn_gate.weightQ4_K[5120 13824]
-
blk.20.ffn_up.weightQ4_K[5120 13824]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weightQ4_K[5120 5120]
-
blk.20.attn_output.weightQ4_K[5120 5120]
-
blk.20.attn_q.weightQ4_K[5120 5120]
-
blk.20.attn_v.weightQ6_K[5120 5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_K[13824 5120]
-
blk.21.ffn_gate.weightQ4_K[5120 13824]
-
blk.21.ffn_up.weightQ4_K[5120 13824]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.weightQ4_K[5120 5120]
-
blk.21.attn_output.weightQ4_K[5120 5120]
-
blk.21.attn_q.weightQ4_K[5120 5120]
-
blk.21.attn_v.weightQ4_K[5120 5120]
-
blk.22.attn_k.weightQ4_K[5120 5120]
-
blk.22.attn_output.weightQ4_K[5120 5120]
-
blk.22.attn_q.weightQ4_K[5120 5120]
-
blk.22.attn_v.weightQ4_K[5120 5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ4_K[13824 5120]
-
blk.22.ffn_gate.weightQ4_K[5120 13824]
-
blk.22.ffn_up.weightQ4_K[5120 13824]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ6_K[13824 5120]
-
blk.23.ffn_gate.weightQ4_K[5120 13824]
-
blk.23.ffn_up.weightQ4_K[5120 13824]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weightQ4_K[5120 5120]
-
blk.23.attn_output.weightQ4_K[5120 5120]
-
blk.23.attn_q.weightQ4_K[5120 5120]
-
blk.23.attn_v.weightQ6_K[5120 5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_K[13824 5120]
-
blk.24.ffn_gate.weightQ4_K[5120 13824]
-
blk.24.ffn_up.weightQ4_K[5120 13824]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.weightQ4_K[5120 5120]
-
blk.24.attn_output.weightQ4_K[5120 5120]
-
blk.24.attn_q.weightQ4_K[5120 5120]
-
blk.24.attn_v.weightQ4_K[5120 5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ4_K[13824 5120]
-
blk.25.ffn_gate.weightQ4_K[5120 13824]
-
blk.25.ffn_up.weightQ4_K[5120 13824]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weightQ4_K[5120 5120]
-
blk.25.attn_output.weightQ4_K[5120 5120]
-
blk.25.attn_q.weightQ4_K[5120 5120]
-
blk.25.attn_v.weightQ4_K[5120 5120]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ6_K[13824 5120]
-
blk.26.ffn_gate.weightQ4_K[5120 13824]
-
blk.26.ffn_up.weightQ4_K[5120 13824]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weightQ4_K[5120 5120]
-
blk.26.attn_output.weightQ4_K[5120 5120]
-
blk.26.attn_q.weightQ4_K[5120 5120]
-
blk.26.attn_v.weightQ6_K[5120 5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_K[13824 5120]
-
blk.27.ffn_gate.weightQ4_K[5120 13824]
-
blk.27.ffn_up.weightQ4_K[5120 13824]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weightQ4_K[5120 5120]
-
blk.27.attn_output.weightQ4_K[5120 5120]
-
blk.27.attn_q.weightQ4_K[5120 5120]
-
blk.27.attn_v.weightQ4_K[5120 5120]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ4_K[13824 5120]
-
blk.28.ffn_gate.weightQ4_K[5120 13824]
-
blk.28.ffn_up.weightQ4_K[5120 13824]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.weightQ4_K[5120 5120]
-
blk.28.attn_output.weightQ4_K[5120 5120]
-
blk.28.attn_q.weightQ4_K[5120 5120]
-
blk.28.attn_v.weightQ4_K[5120 5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ6_K[13824 5120]
-
blk.29.ffn_gate.weightQ4_K[5120 13824]
-
blk.29.ffn_up.weightQ4_K[5120 13824]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weightQ4_K[5120 5120]
-
blk.29.attn_output.weightQ4_K[5120 5120]
-
blk.29.attn_q.weightQ4_K[5120 5120]
-
blk.29.attn_v.weightQ6_K[5120 5120]
-
blk.30.attn_k.weightQ4_K[5120 5120]
-
blk.30.attn_q.weightQ4_K[5120 5120]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_K[13824 5120]
-
blk.30.ffn_gate.weightQ4_K[5120 13824]
-
blk.30.ffn_up.weightQ4_K[5120 13824]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ4_K[5120 5120]
-
blk.30.attn_v.weightQ4_K[5120 5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ4_K[13824 5120]
-
blk.31.ffn_gate.weightQ4_K[5120 13824]
-
blk.31.ffn_up.weightQ4_K[5120 13824]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weightQ4_K[5120 5120]
-
blk.31.attn_output.weightQ4_K[5120 5120]
-
blk.31.attn_q.weightQ4_K[5120 5120]
-
blk.31.attn_v.weightQ4_K[5120 5120]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ6_K[13824 5120]
-
blk.32.ffn_gate.weightQ4_K[5120 13824]
-
blk.32.ffn_up.weightQ4_K[5120 13824]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weightQ4_K[5120 5120]
-
blk.32.attn_output.weightQ4_K[5120 5120]
-
blk.32.attn_q.weightQ4_K[5120 5120]
-
blk.32.attn_v.weightQ6_K[5120 5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_K[13824 5120]
-
blk.33.ffn_gate.weightQ4_K[5120 13824]
-
blk.33.ffn_up.weightQ4_K[5120 13824]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.weightQ4_K[5120 5120]
-
blk.33.attn_output.weightQ4_K[5120 5120]
-
blk.33.attn_q.weightQ4_K[5120 5120]
-
blk.33.attn_v.weightQ4_K[5120 5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ4_K[13824 5120]
-
blk.34.ffn_gate.weightQ4_K[5120 13824]
-
blk.34.ffn_up.weightQ4_K[5120 13824]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weightQ4_K[5120 5120]
-
blk.34.attn_output.weightQ4_K[5120 5120]
-
blk.34.attn_q.weightQ4_K[5120 5120]
-
blk.34.attn_v.weightQ4_K[5120 5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ6_K[13824 5120]
-
blk.35.ffn_gate.weightQ4_K[5120 13824]
-
blk.35.ffn_up.weightQ4_K[5120 13824]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.weightQ4_K[5120 5120]
-
blk.35.attn_output.weightQ4_K[5120 5120]
-
blk.35.attn_q.weightQ4_K[5120 5120]
-
blk.35.attn_v.weightQ6_K[5120 5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ4_K[13824 5120]
-
blk.36.ffn_gate.weightQ4_K[5120 13824]
-
blk.36.ffn_up.weightQ4_K[5120 13824]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weightQ4_K[5120 5120]
-
blk.36.attn_output.weightQ4_K[5120 5120]
-
blk.36.attn_q.weightQ4_K[5120 5120]
-
blk.36.attn_v.weightQ4_K[5120 5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ4_K[13824 5120]
-
blk.37.ffn_gate.weightQ4_K[5120 13824]
-
blk.37.ffn_up.weightQ4_K[5120 13824]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weightQ4_K[5120 5120]
-
blk.37.attn_output.weightQ4_K[5120 5120]
-
blk.37.attn_q.weightQ4_K[5120 5120]
-
blk.37.attn_v.weightQ4_K[5120 5120]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ6_K[13824 5120]
-
blk.38.ffn_gate.weightQ4_K[5120 13824]
-
blk.38.ffn_up.weightQ4_K[5120 13824]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weightQ4_K[5120 5120]
-
blk.38.attn_output.weightQ4_K[5120 5120]
-
blk.38.attn_q.weightQ4_K[5120 5120]
-
blk.38.attn_v.weightQ6_K[5120 5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ4_K[13824 5120]
-
blk.39.ffn_gate.weightQ4_K[5120 13824]
-
blk.39.ffn_up.weightQ4_K[5120 13824]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weightQ4_K[5120 5120]
-
blk.39.attn_output.weightQ4_K[5120 5120]
-
blk.39.attn_q.weightQ4_K[5120 5120]
-
blk.39.attn_v.weightQ4_K[5120 5120]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightQ4_K[13824 5120]
-
blk.40.ffn_gate.weightQ4_K[5120 13824]
-
blk.40.ffn_up.weightQ4_K[5120 13824]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.weightQ4_K[5120 5120]
-
blk.40.attn_output.weightQ4_K[5120 5120]
-
blk.40.attn_q.weightQ4_K[5120 5120]
-
blk.40.attn_v.weightQ4_K[5120 5120]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightQ6_K[13824 5120]
-
blk.41.ffn_gate.weightQ4_K[5120 13824]
-
blk.41.ffn_up.weightQ4_K[5120 13824]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.weightQ4_K[5120 5120]
-
blk.41.attn_output.weightQ4_K[5120 5120]
-
blk.41.attn_q.weightQ4_K[5120 5120]
-
blk.41.attn_v.weightQ6_K[5120 5120]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightQ6_K[13824 5120]
-
blk.42.ffn_gate.weightQ4_K[5120 13824]
-
blk.42.ffn_up.weightQ4_K[5120 13824]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.attn_k.weightQ4_K[5120 5120]
-
blk.42.attn_output.weightQ4_K[5120 5120]
-
blk.42.attn_q.weightQ4_K[5120 5120]
-
blk.42.attn_v.weightQ6_K[5120 5120]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightQ6_K[13824 5120]
-
blk.43.ffn_gate.weightQ4_K[5120 13824]
-
blk.43.ffn_up.weightQ4_K[5120 13824]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.weightQ4_K[5120 5120]
-
blk.43.attn_output.weightQ4_K[5120 5120]
-
blk.43.attn_q.weightQ4_K[5120 5120]
-
blk.43.attn_v.weightQ6_K[5120 5120]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightQ6_K[13824 5120]
-
blk.44.ffn_gate.weightQ4_K[5120 13824]
-
blk.44.ffn_up.weightQ4_K[5120 13824]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.weightQ4_K[5120 5120]
-
blk.44.attn_output.weightQ4_K[5120 5120]
-
blk.44.attn_q.weightQ4_K[5120 5120]
-
blk.44.attn_v.weightQ6_K[5120 5120]
-
blk.45.ffn_gate.weightQ4_K[5120 13824]
-
blk.45.ffn_up.weightQ4_K[5120 13824]
-
blk.45.attn_k.weightQ4_K[5120 5120]
-
blk.45.attn_output.weightQ4_K[5120 5120]
-
blk.45.attn_q.weightQ4_K[5120 5120]
-
blk.45.attn_v.weightQ6_K[5120 5120]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightQ6_K[13824 5120]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightQ6_K[13824 5120]
-
blk.46.ffn_gate.weightQ4_K[5120 13824]
-
blk.46.ffn_up.weightQ4_K[5120 13824]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.attn_k.weightQ4_K[5120 5120]
-
blk.46.attn_output.weightQ4_K[5120 5120]
-
blk.46.attn_q.weightQ4_K[5120 5120]
-
blk.46.attn_v.weightQ6_K[5120 5120]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightQ6_K[13824 5120]
-
blk.47.ffn_gate.weightQ4_K[5120 13824]
-
blk.47.ffn_up.weightQ4_K[5120 13824]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.weightQ4_K[5120 5120]
-
blk.47.attn_output.weightQ4_K[5120 5120]
-
blk.47.attn_q.weightQ4_K[5120 5120]
-
blk.47.attn_v.weightQ6_K[5120 5120]
-
output.weightQ6_K[5120 59392]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47