The powerful Solar-based model by Nous Research that excels at scientific discussion and coding tasks.
63 Pulls · Updated 5 months ago
70735e7d25f7 · 5.8GB
-
general.architecture: llama
-
general.file_type: 30
-
general.name: ..
-
general.quantization_version: 2
-
llama.attention.head_count: 32
-
llama.attention.head_count_kv: 8
-
llama.attention.layer_norm_rms_epsilon: 1e-05
-
llama.block_count: 48
-
llama.context_length: 4096
-
llama.embedding_length: 4096
-
llama.feed_forward_length: 14336
-
llama.rope.dimension_count: 128
-
llama.rope.freq_base: 10000
-
llama.vocab_size: 32002
-
quantize.imatrix.chunks_count: 200
-
quantize.imatrix.dataset: /shared/opt/work_models/_imatrix/groups_merged.txt
-
quantize.imatrix.entries_count: 336
-
quantize.imatrix.file: imatrix.dat
-
tokenizer.ggml.add_bos_token: true
-
tokenizer.ggml.add_eos_token: false
-
tokenizer.ggml.bos_token_id: 1
-
tokenizer.ggml.eos_token_id: 32000
-
tokenizer.ggml.model: llama
-
tokenizer.ggml.pre: default
-
tokenizer.ggml.scores: [0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type: [2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens: [<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
Name | Type | Shape
-
token_embd.weight(!unknown_type 23!)[4096, 32002]
-
blk.0.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_v.weightQ5_K[4096, 1024]
-
blk.0.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_v.weightQ5_K[4096, 1024]
-
blk.1.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_v.weightQ5_K[4096, 1024]
-
blk.2.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_v.weightQ5_K[4096, 1024]
-
blk.3.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_v.weightQ5_K[4096, 1024]
-
blk.4.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_v.weightQ5_K[4096, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_v.weightQ5_K[4096, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_v.weightQ5_K[4096, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_v.weightQ5_K[4096, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_v.weightQ5_K[4096, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_v.weightQ5_K[4096, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_v.weightQ5_K[4096, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_v.weightQ5_K[4096, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_v.weightQ5_K[4096, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_v.weightQ5_K[4096, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_v.weightQ5_K[4096, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_v.weightQ5_K[4096, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_v.weightQ5_K[4096, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_v.weightQ5_K[4096, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_v.weightQ5_K[4096, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_v.weightQ5_K[4096, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_v.weightQ5_K[4096, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_v.weightQ5_K[4096, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_v.weightQ5_K[4096, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_v.weightQ5_K[4096, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_v.weightQ5_K[4096, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_v.weightQ5_K[4096, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_v.weightQ5_K[4096, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_v.weightQ5_K[4096, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_v.weightQ5_K[4096, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_v.weightQ5_K[4096, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_v.weightQ5_K[4096, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.32.attn_v.weightQ5_K[4096, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.33.attn_v.weightQ5_K[4096, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.34.attn_v.weightQ5_K[4096, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.35.attn_v.weightQ5_K[4096, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.36.attn_v.weightQ5_K[4096, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.37.attn_v.weightQ5_K[4096, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.38.attn_v.weightQ5_K[4096, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.39.attn_v.weightQ5_K[4096, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.40.attn_v.weightQ5_K[4096, 1024]
-
blk.40.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.41.attn_v.weightQ5_K[4096, 1024]
-
blk.41.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.42.attn_v.weightQ5_K[4096, 1024]
-
blk.42.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.43.attn_v.weightQ5_K[4096, 1024]
-
blk.43.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.44.attn_v.weightQ5_K[4096, 1024]
-
blk.44.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.45.attn_v.weightQ5_K[4096, 1024]
-
blk.45.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.46.attn_v.weightQ5_K[4096, 1024]
-
blk.46.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.47.attn_v.weightQ5_K[4096, 1024]
-
blk.47.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
output.weightQ6_K[4096, 32002]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47