Polish LLM - Bielik-11B-v2.2-Instruct ~ by SpeakLeash a.k.a Spichlerz!
163 Pulls Updated 3 months ago
21ccbc9d0305 · 6.0GB
-
general.architecturellama
-
general.basenamedpo7
-
general.file_type30
-
general.finetune007.3k
-
general.nametekken
-
general.quantization_version2
-
general.size_label11B
-
general.typemodel
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length32768
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32001
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[4096, 32128]
-
blk.0.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_v.weightQ5_K[4096, 1024]
-
blk.0.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_v.weightQ5_K[4096, 1024]
-
blk.1.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_v.weightQ5_K[4096, 1024]
-
blk.2.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_v.weightQ5_K[4096, 1024]
-
blk.3.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_v.weightQ5_K[4096, 1024]
-
blk.4.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_v.weightQ5_K[4096, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_v.weightQ5_K[4096, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_v.weightQ5_K[4096, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_v.weightQ5_K[4096, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_v.weightQ5_K[4096, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_v.weightQ5_K[4096, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_v.weightQ5_K[4096, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_v.weightQ5_K[4096, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_v.weightQ5_K[4096, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_v.weightQ5_K[4096, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_v.weightQ5_K[4096, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_v.weightQ5_K[4096, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_v.weightQ5_K[4096, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_v.weightQ5_K[4096, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_v.weightQ5_K[4096, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_v.weightQ5_K[4096, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_v.weightQ5_K[4096, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_v.weightQ5_K[4096, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_v.weightQ5_K[4096, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_v.weightQ5_K[4096, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_v.weightQ5_K[4096, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_v.weightQ5_K[4096, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_v.weightQ5_K[4096, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_v.weightQ5_K[4096, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_v.weightQ5_K[4096, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_v.weightQ5_K[4096, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_v.weightQ5_K[4096, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.32.attn_v.weightQ5_K[4096, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.33.attn_v.weightQ5_K[4096, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.34.attn_v.weightQ5_K[4096, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.35.attn_v.weightQ5_K[4096, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.36.attn_v.weightQ5_K[4096, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.37.attn_v.weightQ5_K[4096, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.38.attn_v.weightQ5_K[4096, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.39.attn_v.weightQ5_K[4096, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.40.attn_v.weightQ5_K[4096, 1024]
-
blk.40.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.41.attn_v.weightQ5_K[4096, 1024]
-
blk.41.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.42.attn_v.weightQ5_K[4096, 1024]
-
blk.42.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.43.attn_v.weightQ5_K[4096, 1024]
-
blk.43.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.44.attn_v.weightQ5_K[4096, 1024]
-
blk.44.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.45.attn_v.weightQ5_K[4096, 1024]
-
blk.45.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.46.attn_v.weightQ5_K[4096, 1024]
-
blk.46.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.47.attn_v.weightQ5_K[4096, 1024]
-
blk.47.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.48.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.48.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.48.attn_v.weightQ5_K[4096, 1024]
-
blk.48.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.48.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
blk.49.attn_k.weight(!unknown_type 23!)[4096, 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.49.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.49.attn_v.weightQ5_K[4096, 1024]
-
blk.49.ffn_down.weight(!unknown_type 23!)[14336, 4096]
-
blk.49.ffn_gate.weight(!unknown_type 23!)[4096, 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.ffn_up.weight(!unknown_type 23!)[4096, 14336]
-
output.weightQ6_K[4096, 32128]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49