Polish LLM - Bielik-11B-v2.1-Instruct ~ by SpeakLeash a.k.a Spichlerz!
6 Pulls Updated 3 months ago
66d4cfe41925 · 2.7GB
-
general.architecturellama
-
general.file_type31
-
general.nametekken
-
general.quantization_version2
-
general.size_label11B
-
general.typemodel
-
general.version2.1
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length32768
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32001
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ2_K[4096, 32128]
-
blk.0.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weightI8[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.0.attn_v.weightQ4_K[4096, 1024]
-
blk.0.ffn_down.weightQ2_K[14336, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weightI8[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.1.attn_v.weightQ4_K[4096, 1024]
-
blk.1.ffn_down.weightQ2_K[14336, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weightI8[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.2.attn_v.weightQ4_K[4096, 1024]
-
blk.2.ffn_down.weightQ2_K[14336, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weightI8[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.3.attn_v.weightQ4_K[4096, 1024]
-
blk.3.ffn_down.weightQ2_K[14336, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weightI8[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.4.attn_v.weightQ4_K[4096, 1024]
-
blk.4.ffn_down.weightQ2_K[14336, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weightI8[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.5.attn_v.weightQ4_K[4096, 1024]
-
blk.5.ffn_down.weightQ2_K[14336, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weightI8[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.6.attn_v.weightQ4_K[4096, 1024]
-
blk.6.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weightI8[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.7.attn_v.weightQ4_K[4096, 1024]
-
blk.7.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weightI8[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.8.attn_v.weightQ4_K[4096, 1024]
-
blk.8.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weightI8[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.9.attn_v.weightQ4_K[4096, 1024]
-
blk.9.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weightI8[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.10.attn_v.weightQ4_K[4096, 1024]
-
blk.10.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weightI8[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.11.attn_v.weightQ4_K[4096, 1024]
-
blk.11.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weightI8[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.12.attn_v.weightQ4_K[4096, 1024]
-
blk.12.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weightI8[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.13.attn_v.weightQ4_K[4096, 1024]
-
blk.13.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weightI8[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.14.attn_v.weightQ4_K[4096, 1024]
-
blk.14.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weightI8[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.15.attn_v.weightQ4_K[4096, 1024]
-
blk.15.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weightI8[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.16.attn_v.weightQ4_K[4096, 1024]
-
blk.16.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weightI8[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.17.attn_v.weightQ4_K[4096, 1024]
-
blk.17.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weightI8[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.18.attn_v.weightQ4_K[4096, 1024]
-
blk.18.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weightI8[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.19.attn_v.weightQ4_K[4096, 1024]
-
blk.19.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weightI8[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.20.attn_v.weightQ4_K[4096, 1024]
-
blk.20.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weightI8[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.21.attn_v.weightQ4_K[4096, 1024]
-
blk.21.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weightI8[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.22.attn_v.weightQ4_K[4096, 1024]
-
blk.22.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weightI8[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.23.attn_v.weightQ4_K[4096, 1024]
-
blk.23.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weightI8[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.24.attn_v.weightQ4_K[4096, 1024]
-
blk.24.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weightI8[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.25.attn_v.weightQ4_K[4096, 1024]
-
blk.25.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weightI8[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.26.attn_v.weightQ4_K[4096, 1024]
-
blk.26.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weightI8[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.27.attn_v.weightQ4_K[4096, 1024]
-
blk.27.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weightI8[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.28.attn_v.weightQ4_K[4096, 1024]
-
blk.28.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weightI8[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.29.attn_v.weightQ4_K[4096, 1024]
-
blk.29.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weightI8[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.30.attn_v.weightQ4_K[4096, 1024]
-
blk.30.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weightI8[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.31.attn_v.weightQ4_K[4096, 1024]
-
blk.31.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weightI8[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.32.attn_v.weightQ4_K[4096, 1024]
-
blk.32.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weightI8[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.33.attn_v.weightQ4_K[4096, 1024]
-
blk.33.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weightI8[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.34.attn_v.weightQ4_K[4096, 1024]
-
blk.34.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weightI8[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.35.attn_v.weightQ4_K[4096, 1024]
-
blk.35.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weightI8[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.36.attn_v.weightQ4_K[4096, 1024]
-
blk.36.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weightI8[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.37.attn_v.weightQ4_K[4096, 1024]
-
blk.37.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weightI8[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.38.attn_v.weightQ4_K[4096, 1024]
-
blk.38.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weightI8[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.39.attn_v.weightQ4_K[4096, 1024]
-
blk.39.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weightI8[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.40.attn_v.weightQ4_K[4096, 1024]
-
blk.40.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weightI8[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.41.attn_v.weightQ4_K[4096, 1024]
-
blk.41.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weightI8[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.42.attn_v.weightQ4_K[4096, 1024]
-
blk.42.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weightI8[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.43.attn_v.weightQ4_K[4096, 1024]
-
blk.43.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weightI8[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.44.attn_v.weightQ4_K[4096, 1024]
-
blk.44.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weightI8[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.45.attn_v.weightQ4_K[4096, 1024]
-
blk.45.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weightI8[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.46.attn_v.weightQ4_K[4096, 1024]
-
blk.46.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weightI8[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.47.attn_v.weightQ4_K[4096, 1024]
-
blk.47.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_output.weightI8[4096, 4096]
-
blk.48.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.48.attn_v.weightQ4_K[4096, 1024]
-
blk.48.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_output.weightI8[4096, 4096]
-
blk.49.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.49.attn_v.weightQ4_K[4096, 1024]
-
blk.49.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
output.weightQ5_K[4096, 32128]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49