Arcee-SuperNova-Medius is a 14B parameter language model developed by Arcee.ai, built on the Qwen2.5-14B-Instruct architecture.
Tools
14B
139 Pulls Updated 4 days ago
c3e6db263558 · 6.4GB
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count336
-
quantize.imatrix.file/models_out/SuperNova-14B-GGUF/SuperNova-14B.imatrix
-
general.architectureqwen2
-
general.file_typeIQ3_XS
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-05
-
qwen2.block_count48
-
qwen2.context_length131072
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length13824
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.0.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightI32[5120 1024]
-
blk.0.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightI32[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.1.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightI32[5120 1024]
-
blk.1.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightI32[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.2.ffn_gate.weightI32[5120 13824]
-
blk.2.ffn_up.weightI32[5120 13824]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightI32[5120 1024]
-
blk.2.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightI32[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.3.ffn_gate.weightI32[5120 13824]
-
blk.3.ffn_up.weightI32[5120 13824]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightI32[5120 1024]
-
blk.3.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightI32[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.4.ffn_gate.weightI32[5120 13824]
-
blk.4.ffn_up.weightI32[5120 13824]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightI32[5120 1024]
-
blk.4.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightI32[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.5.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightI32[5120 1024]
-
blk.5.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightI32[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.6.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightI32[5120 1024]
-
blk.6.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightI32[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[5120 1024]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.7.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightI32[5120 1024]
-
blk.7.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightI32[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.8.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightI32[5120 1024]
-
blk.8.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightI32[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.9.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightI32[5120 1024]
-
blk.9.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightI32[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.10.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightI32[5120 1024]
-
blk.10.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightI32[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.11.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightI32[5120 1024]
-
blk.11.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightI32[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.12.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightI32[5120 1024]
-
blk.12.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightI32[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.13.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightI32[5120 1024]
-
blk.13.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightI32[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.14.ffn_gate.weightI32[5120 13824]
-
blk.14.ffn_up.weightI32[5120 13824]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightI32[5120 1024]
-
blk.14.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightI32[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.15.ffn_gate.weightI32[5120 13824]
-
blk.15.ffn_up.weightI32[5120 13824]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightI32[5120 1024]
-
blk.15.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightI32[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.16.ffn_gate.weightI32[5120 13824]
-
blk.16.ffn_up.weightI32[5120 13824]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightI32[5120 1024]
-
blk.16.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightI32[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.17.ffn_gate.weightI32[5120 13824]
-
blk.17.ffn_up.weightI32[5120 13824]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightI32[5120 1024]
-
blk.17.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightI32[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.18.ffn_gate.weightI32[5120 13824]
-
blk.18.ffn_up.weightI32[5120 13824]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightI32[5120 1024]
-
blk.18.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightI32[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[5120 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.19.ffn_gate.weightI32[5120 13824]
-
blk.19.ffn_up.weightI32[5120 13824]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightI32[5120 1024]
-
blk.19.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightI32[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.20.ffn_gate.weightI32[5120 13824]
-
blk.20.ffn_up.weightI32[5120 13824]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightI32[5120 1024]
-
blk.20.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightI32[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.21.ffn_gate.weightI32[5120 13824]
-
blk.21.ffn_up.weightI32[5120 13824]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightI32[5120 1024]
-
blk.21.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightI32[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.22.ffn_gate.weightI32[5120 13824]
-
blk.22.ffn_up.weightI32[5120 13824]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightI32[5120 1024]
-
blk.22.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightI32[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.23.ffn_gate.weightI32[5120 13824]
-
blk.23.ffn_up.weightI32[5120 13824]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightI32[5120 1024]
-
blk.23.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightI32[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.24.ffn_gate.weightI32[5120 13824]
-
blk.24.ffn_up.weightI32[5120 13824]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightI32[5120 1024]
-
blk.24.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightI32[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[5120 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.25.ffn_gate.weightI32[5120 13824]
-
blk.25.ffn_up.weightI32[5120 13824]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightI32[5120 1024]
-
blk.25.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightI32[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.26.ffn_gate.weightI32[5120 13824]
-
blk.26.ffn_up.weightI32[5120 13824]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightI32[5120 1024]
-
blk.26.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightI32[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.27.ffn_gate.weightI32[5120 13824]
-
blk.27.ffn_up.weightI32[5120 13824]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightI32[5120 1024]
-
blk.27.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightI32[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.28.ffn_gate.weightI32[5120 13824]
-
blk.28.ffn_up.weightI32[5120 13824]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightI32[5120 1024]
-
blk.28.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightI32[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.29.ffn_gate.weightI32[5120 13824]
-
blk.29.ffn_up.weightI32[5120 13824]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightI32[5120 1024]
-
blk.29.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightI32[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.30.ffn_gate.weightI32[5120 13824]
-
blk.30.ffn_up.weightI32[5120 13824]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightI32[5120 1024]
-
blk.30.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightI32[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.31.ffn_gate.weightI32[5120 13824]
-
blk.31.ffn_up.weightI32[5120 13824]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightI32[5120 1024]
-
blk.31.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightI32[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.32.ffn_gate.weightI32[5120 13824]
-
blk.32.ffn_up.weightI32[5120 13824]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightI32[5120 1024]
-
blk.32.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightI32[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.33.ffn_gate.weightI32[5120 13824]
-
blk.33.ffn_up.weightI32[5120 13824]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightI32[5120 1024]
-
blk.33.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightI32[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[5120 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.34.ffn_gate.weightI32[5120 13824]
-
blk.34.ffn_up.weightI32[5120 13824]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightI32[5120 1024]
-
blk.34.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightI32[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.35.ffn_gate.weightI32[5120 13824]
-
blk.35.ffn_up.weightI32[5120 13824]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightI32[5120 1024]
-
blk.35.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightI32[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.36.ffn_gate.weightI32[5120 13824]
-
blk.36.ffn_up.weightI32[5120 13824]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightI32[5120 1024]
-
blk.36.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightI32[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.37.ffn_gate.weightI32[5120 13824]
-
blk.37.ffn_up.weightI32[5120 13824]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightI32[5120 1024]
-
blk.37.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightI32[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.38.ffn_gate.weightI32[5120 13824]
-
blk.38.ffn_up.weightI32[5120 13824]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightI32[5120 1024]
-
blk.38.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightI32[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[5120 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.39.ffn_gate.weightI32[5120 13824]
-
blk.39.ffn_up.weightI32[5120 13824]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightI32[5120 1024]
-
blk.39.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightI32[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.40.ffn_gate.weightI32[5120 13824]
-
blk.40.ffn_up.weightI32[5120 13824]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightI32[5120 1024]
-
blk.40.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightI32[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[5120 1024]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.41.ffn_gate.weightI32[5120 13824]
-
blk.41.ffn_up.weightI32[5120 13824]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightI32[5120 1024]
-
blk.41.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightI32[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.42.ffn_gate.weightI32[5120 13824]
-
blk.42.ffn_up.weightI32[5120 13824]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightI32[5120 1024]
-
blk.42.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightI32[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[5120 1024]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.43.ffn_gate.weightI32[5120 13824]
-
blk.43.ffn_up.weightI32[5120 13824]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightI32[5120 1024]
-
blk.43.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightI32[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[5120 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.44.ffn_gate.weightI32[5120 13824]
-
blk.44.ffn_up.weightI32[5120 13824]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightI32[5120 1024]
-
blk.44.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightI32[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[5120 1024]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.45.ffn_gate.weightI32[5120 13824]
-
blk.45.ffn_up.weightI32[5120 13824]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightI32[5120 1024]
-
blk.45.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightI32[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.46.ffn_gate.weightI32[5120 13824]
-
blk.46.ffn_up.weightI32[5120 13824]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightI32[5120 1024]
-
blk.46.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightI32[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[5120 1024]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.47.ffn_gate.weight(!unknown_type 21!)[5120 13824]
-
blk.47.ffn_up.weight(!unknown_type 21!)[5120 13824]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightI32[5120 1024]
-
blk.47.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightI32[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[5120 1024]
-
output.weightQ6_K[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47