Arcee-SuperNova-Medius is a 14B parameter language model developed by Arcee.ai, built on the Qwen2.5-14B-Instruct architecture.
Tools
14B
139 Pulls Updated 4 days ago
bfb23b90e821 · 5.0GB
-
quantize.imatrix.chunks_count128
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count336
-
quantize.imatrix.file/models_out/SuperNova-14B-GGUF/SuperNova-14B.imatrix
-
general.architectureqwen2
-
general.file_typeIQ4_XS
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-05
-
qwen2.block_count48
-
qwen2.context_length131072
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length13824
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.0.ffn_gate.weightI16[5120 13824]
-
blk.0.ffn_up.weightI16[5120 13824]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightI16[5120 1024]
-
blk.0.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightI16[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.1.ffn_gate.weightI16[5120 13824]
-
blk.1.ffn_up.weightI16[5120 13824]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightI16[5120 1024]
-
blk.1.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightI16[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightI16[13824 5120]
-
blk.2.ffn_gate.weightI16[5120 13824]
-
blk.2.ffn_up.weightI16[5120 13824]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightI16[5120 1024]
-
blk.2.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightI16[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightI16[13824 5120]
-
blk.3.ffn_gate.weightI16[5120 13824]
-
blk.3.ffn_up.weightI16[5120 13824]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightI16[5120 1024]
-
blk.3.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightI16[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightI16[13824 5120]
-
blk.4.ffn_gate.weightI16[5120 13824]
-
blk.4.ffn_up.weightI16[5120 13824]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightI16[5120 1024]
-
blk.4.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightI16[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightI16[13824 5120]
-
blk.5.ffn_gate.weightI16[5120 13824]
-
blk.5.ffn_up.weightI16[5120 13824]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightI16[5120 1024]
-
blk.5.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightI16[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightI16[13824 5120]
-
blk.6.ffn_gate.weightI16[5120 13824]
-
blk.6.ffn_up.weightI16[5120 13824]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightI16[5120 1024]
-
blk.6.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightI16[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[5120 1024]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightI16[13824 5120]
-
blk.7.ffn_gate.weightI16[5120 13824]
-
blk.7.ffn_up.weightI16[5120 13824]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightI16[5120 1024]
-
blk.7.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightI16[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightI16[13824 5120]
-
blk.8.ffn_gate.weightI16[5120 13824]
-
blk.8.ffn_up.weightI16[5120 13824]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightI16[5120 1024]
-
blk.8.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightI16[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightI16[13824 5120]
-
blk.9.ffn_gate.weightI16[5120 13824]
-
blk.9.ffn_up.weightI16[5120 13824]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightI16[5120 1024]
-
blk.9.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightI16[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.10.ffn_gate.weightI16[5120 13824]
-
blk.10.ffn_up.weightI16[5120 13824]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightI16[5120 1024]
-
blk.10.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightI16[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.11.ffn_gate.weightI16[5120 13824]
-
blk.11.ffn_up.weightI16[5120 13824]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightI16[5120 1024]
-
blk.11.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightI16[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.12.ffn_gate.weightI16[5120 13824]
-
blk.12.ffn_up.weightI16[5120 13824]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightI16[5120 1024]
-
blk.12.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightI16[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weight(!unknown_type 21!)[13824 5120]
-
blk.13.ffn_gate.weightI16[5120 13824]
-
blk.13.ffn_up.weightI16[5120 13824]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightI16[5120 1024]
-
blk.13.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightI16[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightI16[13824 5120]
-
blk.14.ffn_gate.weightI16[5120 13824]
-
blk.14.ffn_up.weightI16[5120 13824]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightI16[5120 1024]
-
blk.14.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightI16[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightI16[13824 5120]
-
blk.15.ffn_gate.weightI16[5120 13824]
-
blk.15.ffn_up.weightI16[5120 13824]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightI16[5120 1024]
-
blk.15.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightI16[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightI16[13824 5120]
-
blk.16.ffn_gate.weightI16[5120 13824]
-
blk.16.ffn_up.weightI16[5120 13824]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightI16[5120 1024]
-
blk.16.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightI16[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightI16[13824 5120]
-
blk.17.ffn_gate.weightI16[5120 13824]
-
blk.17.ffn_up.weightI16[5120 13824]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightI16[5120 1024]
-
blk.17.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightI16[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightI16[13824 5120]
-
blk.18.ffn_gate.weightI16[5120 13824]
-
blk.18.ffn_up.weightI16[5120 13824]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightI16[5120 1024]
-
blk.18.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightI16[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[5120 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightI16[13824 5120]
-
blk.19.ffn_gate.weightI16[5120 13824]
-
blk.19.ffn_up.weightI16[5120 13824]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightI16[5120 1024]
-
blk.19.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightI16[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightI16[13824 5120]
-
blk.20.ffn_gate.weightI16[5120 13824]
-
blk.20.ffn_up.weightI16[5120 13824]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightI16[5120 1024]
-
blk.20.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightI16[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightI16[13824 5120]
-
blk.21.ffn_gate.weightI16[5120 13824]
-
blk.21.ffn_up.weightI16[5120 13824]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightI16[5120 1024]
-
blk.21.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightI16[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightI16[13824 5120]
-
blk.22.ffn_gate.weightI16[5120 13824]
-
blk.22.ffn_up.weightI16[5120 13824]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightI16[5120 1024]
-
blk.22.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightI16[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightI16[13824 5120]
-
blk.23.ffn_gate.weightI16[5120 13824]
-
blk.23.ffn_up.weightI16[5120 13824]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightI16[5120 1024]
-
blk.23.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightI16[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightI16[13824 5120]
-
blk.24.ffn_gate.weightI16[5120 13824]
-
blk.24.ffn_up.weightI16[5120 13824]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightI16[5120 1024]
-
blk.24.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightI16[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[5120 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightI16[13824 5120]
-
blk.25.ffn_gate.weightI16[5120 13824]
-
blk.25.ffn_up.weightI16[5120 13824]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightI16[5120 1024]
-
blk.25.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightI16[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightI16[13824 5120]
-
blk.26.ffn_gate.weightI16[5120 13824]
-
blk.26.ffn_up.weightI16[5120 13824]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightI16[5120 1024]
-
blk.26.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightI16[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightI16[13824 5120]
-
blk.27.ffn_gate.weightI16[5120 13824]
-
blk.27.ffn_up.weightI16[5120 13824]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightI16[5120 1024]
-
blk.27.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightI16[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightI16[13824 5120]
-
blk.28.ffn_gate.weightI16[5120 13824]
-
blk.28.ffn_up.weightI16[5120 13824]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightI16[5120 1024]
-
blk.28.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightI16[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightI16[13824 5120]
-
blk.29.ffn_gate.weightI16[5120 13824]
-
blk.29.ffn_up.weightI16[5120 13824]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightI16[5120 1024]
-
blk.29.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightI16[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightI16[13824 5120]
-
blk.30.ffn_gate.weightI16[5120 13824]
-
blk.30.ffn_up.weightI16[5120 13824]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightI16[5120 1024]
-
blk.30.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightI16[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightI16[13824 5120]
-
blk.31.ffn_gate.weightI16[5120 13824]
-
blk.31.ffn_up.weightI16[5120 13824]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightI16[5120 1024]
-
blk.31.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightI16[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightI16[13824 5120]
-
blk.32.ffn_gate.weightI16[5120 13824]
-
blk.32.ffn_up.weightI16[5120 13824]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightI16[5120 1024]
-
blk.32.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightI16[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightI16[13824 5120]
-
blk.33.ffn_gate.weightI16[5120 13824]
-
blk.33.ffn_up.weightI16[5120 13824]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightI16[5120 1024]
-
blk.33.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightI16[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[5120 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightI16[13824 5120]
-
blk.34.ffn_gate.weightI16[5120 13824]
-
blk.34.ffn_up.weightI16[5120 13824]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightI16[5120 1024]
-
blk.34.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightI16[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightI16[13824 5120]
-
blk.35.ffn_gate.weightI16[5120 13824]
-
blk.35.ffn_up.weightI16[5120 13824]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightI16[5120 1024]
-
blk.35.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightI16[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightI16[13824 5120]
-
blk.36.ffn_gate.weightI16[5120 13824]
-
blk.36.ffn_up.weightI16[5120 13824]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightI16[5120 1024]
-
blk.36.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightI16[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightI16[13824 5120]
-
blk.37.ffn_gate.weightI16[5120 13824]
-
blk.37.ffn_up.weightI16[5120 13824]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightI16[5120 1024]
-
blk.37.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightI16[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightI16[13824 5120]
-
blk.38.ffn_gate.weightI16[5120 13824]
-
blk.38.ffn_up.weightI16[5120 13824]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightI16[5120 1024]
-
blk.38.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightI16[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[5120 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightI16[13824 5120]
-
blk.39.ffn_gate.weightI16[5120 13824]
-
blk.39.ffn_up.weightI16[5120 13824]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightI16[5120 1024]
-
blk.39.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightI16[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightI16[13824 5120]
-
blk.40.ffn_gate.weightI16[5120 13824]
-
blk.40.ffn_up.weightI16[5120 13824]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightI16[5120 1024]
-
blk.40.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightI16[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[5120 1024]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightI16[13824 5120]
-
blk.41.ffn_gate.weightI16[5120 13824]
-
blk.41.ffn_up.weightI16[5120 13824]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightI16[5120 1024]
-
blk.41.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightI16[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightI16[13824 5120]
-
blk.42.ffn_gate.weightI16[5120 13824]
-
blk.42.ffn_up.weightI16[5120 13824]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightI16[5120 1024]
-
blk.42.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightI16[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[5120 1024]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightI16[13824 5120]
-
blk.43.ffn_gate.weightI16[5120 13824]
-
blk.43.ffn_up.weightI16[5120 13824]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightI16[5120 1024]
-
blk.43.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightI16[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[5120 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightI16[13824 5120]
-
blk.44.ffn_gate.weightI16[5120 13824]
-
blk.44.ffn_up.weightI16[5120 13824]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightI16[5120 1024]
-
blk.44.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightI16[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[5120 1024]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightI16[13824 5120]
-
blk.45.ffn_gate.weightI16[5120 13824]
-
blk.45.ffn_up.weightI16[5120 13824]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightI16[5120 1024]
-
blk.45.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightI16[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightI16[13824 5120]
-
blk.46.ffn_gate.weightI16[5120 13824]
-
blk.46.ffn_up.weightI16[5120 13824]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightI16[5120 1024]
-
blk.46.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightI16[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[5120 1024]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightI16[13824 5120]
-
blk.47.ffn_gate.weightI16[5120 13824]
-
blk.47.ffn_up.weightI16[5120 13824]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightI16[5120 1024]
-
blk.47.attn_output.weight(!unknown_type 21!)[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightI16[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[5120 1024]
-
output.weightQ5_K[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47