Polish LLM - Bielik-11B-v2.0-Instruct ~ by SpeakLeash a.k.a Spichlerz!
3 Pulls Updated 6 weeks ago
aab6e7af9b02 · 6.0GB
-
general.architecturellama
-
general.file_type30
-
general.nametekken
-
general.quantization_version2
-
general.size_label11B
-
general.typemodel
-
general.version2.0
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length8192
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[4096, 32128]
-
blk.0.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_v.weightQ5_K[4096, 1024]
-
blk.0.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_v.weightQ5_K[4096, 1024]
-
blk.1.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_v.weightQ5_K[4096, 1024]
-
blk.2.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_v.weightQ5_K[4096, 1024]
-
blk.3.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_v.weightQ5_K[4096, 1024]
-
blk.4.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_v.weightQ5_K[4096, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_v.weightQ5_K[4096, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_v.weightQ5_K[4096, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_v.weightQ5_K[4096, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_v.weightQ5_K[4096, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_v.weightQ5_K[4096, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_v.weightQ5_K[4096, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_v.weightQ5_K[4096, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_v.weightQ5_K[4096, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_v.weightQ5_K[4096, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_v.weightQ5_K[4096, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_v.weightQ5_K[4096, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_v.weightQ5_K[4096, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_v.weightQ5_K[4096, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_v.weightQ5_K[4096, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_v.weightQ5_K[4096, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_v.weightQ5_K[4096, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_v.weightQ5_K[4096, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_v.weightQ5_K[4096, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_v.weightQ5_K[4096, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_v.weightQ5_K[4096, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_v.weightQ5_K[4096, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_v.weightQ5_K[4096, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_v.weightQ5_K[4096, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_v.weightQ5_K[4096, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_v.weightQ5_K[4096, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_v.weightQ5_K[4096, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.32.attn_v.weightQ5_K[4096, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.33.attn_v.weightQ5_K[4096, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.34.attn_v.weightQ5_K[4096, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.35.attn_v.weightQ5_K[4096, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.36.attn_v.weightQ5_K[4096, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.37.attn_v.weightQ5_K[4096, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.38.attn_v.weightQ5_K[4096, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.39.attn_v.weightQ5_K[4096, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.40.attn_v.weightQ5_K[4096, 1024]
-
blk.40.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.41.attn_v.weightQ5_K[4096, 1024]
-
blk.41.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.42.attn_v.weightQ5_K[4096, 1024]
-
blk.42.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.43.attn_v.weightQ5_K[4096, 1024]
-
blk.43.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.44.attn_v.weightQ5_K[4096, 1024]
-
blk.44.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.45.attn_v.weightQ5_K[4096, 1024]
-
blk.45.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.46.attn_v.weightQ5_K[4096, 1024]
-
blk.46.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.47.attn_v.weightQ5_K[4096, 1024]
-
blk.47.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.48.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.48.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.48.attn_v.weightQ5_K[4096, 1024]
-
blk.48.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.48.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.49.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.49.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.49.attn_v.weightQ5_K[4096, 1024]
-
blk.49.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.49.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
output.weightQ6_K[4096, 32128]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49