Polish LLM - Bielik-11B-v2.0-Instruct ~ by SpeakLeash a.k.a Spichlerz!
12 Pulls Updated 2 months ago
3de90ad3761a · 2.7GB
-
general.architecturellama
-
general.file_type31
-
general.nametekken
-
general.quantization_version2
-
general.size_label11B
-
general.typemodel
-
general.version2.0
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length8192
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ2_K[4096, 32128]
-
blk.0.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weightI8[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.0.attn_v.weightQ4_K[4096, 1024]
-
blk.0.ffn_down.weightQ2_K[14336, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weightI8[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.1.attn_v.weightQ4_K[4096, 1024]
-
blk.1.ffn_down.weightQ2_K[14336, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weightI8[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.2.attn_v.weightQ4_K[4096, 1024]
-
blk.2.ffn_down.weightQ2_K[14336, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weightI8[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.3.attn_v.weightQ4_K[4096, 1024]
-
blk.3.ffn_down.weightQ2_K[14336, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weightI8[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.4.attn_v.weightQ4_K[4096, 1024]
-
blk.4.ffn_down.weightQ2_K[14336, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weightI8[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.5.attn_v.weightQ4_K[4096, 1024]
-
blk.5.ffn_down.weightQ2_K[14336, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weightI8[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.6.attn_v.weightQ4_K[4096, 1024]
-
blk.6.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weightI8[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.7.attn_v.weightQ4_K[4096, 1024]
-
blk.7.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weightI8[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.8.attn_v.weightQ4_K[4096, 1024]
-
blk.8.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weightI8[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.9.attn_v.weightQ4_K[4096, 1024]
-
blk.9.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weightI8[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.10.attn_v.weightQ4_K[4096, 1024]
-
blk.10.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weightI8[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.11.attn_v.weightQ4_K[4096, 1024]
-
blk.11.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weightI8[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.12.attn_v.weightQ4_K[4096, 1024]
-
blk.12.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weightI8[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.13.attn_v.weightQ4_K[4096, 1024]
-
blk.13.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weightI8[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.14.attn_v.weightQ4_K[4096, 1024]
-
blk.14.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weightI8[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.15.attn_v.weightQ4_K[4096, 1024]
-
blk.15.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weightI8[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.16.attn_v.weightQ4_K[4096, 1024]
-
blk.16.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weightI8[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.17.attn_v.weightQ4_K[4096, 1024]
-
blk.17.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weightI8[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.18.attn_v.weightQ4_K[4096, 1024]
-
blk.18.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weightI8[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.19.attn_v.weightQ4_K[4096, 1024]
-
blk.19.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weightI8[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.20.attn_v.weightQ4_K[4096, 1024]
-
blk.20.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weightI8[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.21.attn_v.weightQ4_K[4096, 1024]
-
blk.21.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weightI8[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.22.attn_v.weightQ4_K[4096, 1024]
-
blk.22.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weightI8[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.23.attn_v.weightQ4_K[4096, 1024]
-
blk.23.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weightI8[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.24.attn_v.weightQ4_K[4096, 1024]
-
blk.24.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weightI8[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.25.attn_v.weightQ4_K[4096, 1024]
-
blk.25.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weightI8[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.26.attn_v.weightQ4_K[4096, 1024]
-
blk.26.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weightI8[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.27.attn_v.weightQ4_K[4096, 1024]
-
blk.27.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weightI8[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.28.attn_v.weightQ4_K[4096, 1024]
-
blk.28.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weightI8[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.29.attn_v.weightQ4_K[4096, 1024]
-
blk.29.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weightI8[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.30.attn_v.weightQ4_K[4096, 1024]
-
blk.30.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weightI8[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.31.attn_v.weightQ4_K[4096, 1024]
-
blk.31.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weightI8[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.32.attn_v.weightQ4_K[4096, 1024]
-
blk.32.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weightI8[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.33.attn_v.weightQ4_K[4096, 1024]
-
blk.33.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weightI8[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.34.attn_v.weightQ4_K[4096, 1024]
-
blk.34.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weightI8[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.35.attn_v.weightQ4_K[4096, 1024]
-
blk.35.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weightI8[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.36.attn_v.weightQ4_K[4096, 1024]
-
blk.36.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weightI8[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.37.attn_v.weightQ4_K[4096, 1024]
-
blk.37.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weightI8[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.38.attn_v.weightQ4_K[4096, 1024]
-
blk.38.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weightI8[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.39.attn_v.weightQ4_K[4096, 1024]
-
blk.39.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weightI8[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.40.attn_v.weightQ4_K[4096, 1024]
-
blk.40.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weightI8[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.41.attn_v.weightQ4_K[4096, 1024]
-
blk.41.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weightI8[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.42.attn_v.weightQ4_K[4096, 1024]
-
blk.42.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weightI8[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.43.attn_v.weightQ4_K[4096, 1024]
-
blk.43.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weightI8[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.44.attn_v.weightQ4_K[4096, 1024]
-
blk.44.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weightI8[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.45.attn_v.weightQ4_K[4096, 1024]
-
blk.45.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weightI8[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.46.attn_v.weightQ4_K[4096, 1024]
-
blk.46.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weightI8[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.47.attn_v.weightQ4_K[4096, 1024]
-
blk.47.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_output.weightI8[4096, 4096]
-
blk.48.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.48.attn_v.weightQ4_K[4096, 1024]
-
blk.48.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_output.weightI8[4096, 4096]
-
blk.49.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.49.attn_v.weightQ4_K[4096, 1024]
-
blk.49.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
output.weightQ5_K[4096, 32128]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49