Polish LLM - Bielik-11B-v2.3-Instruct ~ by SpeakLeash a.k.a Spichlerz!
137 Pulls Updated 2 months ago
600ed73347c3 · 4.3GB
-
general.architecturellama
-
general.base_model.count0
-
general.file_type23
-
general.nametekken
-
general.quantization_version2
-
general.size_label11B
-
general.tags[mergekit, merge]
-
general.typemodel
-
general.version0-2
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length32768
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32001
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[4096, 32128]
-
blk.0.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.0.attn_v.weightQ4_K[4096, 1024]
-
blk.0.ffn_down.weightI32[14336, 4096]
-
blk.0.ffn_gate.weightI32[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weightI32[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.1.attn_v.weightQ4_K[4096, 1024]
-
blk.1.ffn_down.weightI32[14336, 4096]
-
blk.1.ffn_gate.weightI32[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weightI32[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.2.attn_v.weightQ4_K[4096, 1024]
-
blk.2.ffn_down.weightI32[14336, 4096]
-
blk.2.ffn_gate.weightI32[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weightI32[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.3.attn_v.weightQ4_K[4096, 1024]
-
blk.3.ffn_down.weightI32[14336, 4096]
-
blk.3.ffn_gate.weightI32[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weightI32[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.4.attn_v.weightQ4_K[4096, 1024]
-
blk.4.ffn_down.weightI32[14336, 4096]
-
blk.4.ffn_gate.weightI32[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weightI32[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.5.attn_v.weightQ4_K[4096, 1024]
-
blk.5.ffn_down.weightI32[14336, 4096]
-
blk.5.ffn_gate.weightI32[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weightI32[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.6.attn_v.weightQ4_K[4096, 1024]
-
blk.6.ffn_down.weightI32[14336, 4096]
-
blk.6.ffn_gate.weightI32[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weightI32[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.7.attn_v.weightQ4_K[4096, 1024]
-
blk.7.ffn_down.weightI32[14336, 4096]
-
blk.7.ffn_gate.weightI32[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weightI32[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.8.attn_v.weightQ4_K[4096, 1024]
-
blk.8.ffn_down.weightI32[14336, 4096]
-
blk.8.ffn_gate.weightI32[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weightI32[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.9.attn_v.weightQ4_K[4096, 1024]
-
blk.9.ffn_down.weightI32[14336, 4096]
-
blk.9.ffn_gate.weightI32[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weightI32[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.10.attn_v.weightQ4_K[4096, 1024]
-
blk.10.ffn_down.weightI32[14336, 4096]
-
blk.10.ffn_gate.weightI32[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weightI32[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.11.attn_v.weightQ4_K[4096, 1024]
-
blk.11.ffn_down.weightI32[14336, 4096]
-
blk.11.ffn_gate.weightI32[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weightI32[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.12.attn_v.weightQ4_K[4096, 1024]
-
blk.12.ffn_down.weightI32[14336, 4096]
-
blk.12.ffn_gate.weightI32[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weightI32[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.13.attn_v.weightQ4_K[4096, 1024]
-
blk.13.ffn_down.weightI32[14336, 4096]
-
blk.13.ffn_gate.weightI32[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weightI32[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.14.attn_v.weightQ4_K[4096, 1024]
-
blk.14.ffn_down.weightI32[14336, 4096]
-
blk.14.ffn_gate.weightI32[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weightI32[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.15.attn_v.weightQ4_K[4096, 1024]
-
blk.15.ffn_down.weightI32[14336, 4096]
-
blk.15.ffn_gate.weightI32[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weightI32[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.16.attn_v.weightQ4_K[4096, 1024]
-
blk.16.ffn_down.weightI32[14336, 4096]
-
blk.16.ffn_gate.weightI32[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weightI32[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.17.attn_v.weightQ4_K[4096, 1024]
-
blk.17.ffn_down.weightI32[14336, 4096]
-
blk.17.ffn_gate.weightI32[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weightI32[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.18.attn_v.weightQ4_K[4096, 1024]
-
blk.18.ffn_down.weightI32[14336, 4096]
-
blk.18.ffn_gate.weightI32[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weightI32[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.19.attn_v.weightQ4_K[4096, 1024]
-
blk.19.ffn_down.weightI32[14336, 4096]
-
blk.19.ffn_gate.weightI32[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weightI32[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.20.attn_v.weightQ4_K[4096, 1024]
-
blk.20.ffn_down.weightI32[14336, 4096]
-
blk.20.ffn_gate.weightI32[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weightI32[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.21.attn_v.weightQ4_K[4096, 1024]
-
blk.21.ffn_down.weightI32[14336, 4096]
-
blk.21.ffn_gate.weightI32[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weightI32[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.22.attn_v.weightQ4_K[4096, 1024]
-
blk.22.ffn_down.weightI32[14336, 4096]
-
blk.22.ffn_gate.weightI32[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weightI32[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.23.attn_v.weightQ4_K[4096, 1024]
-
blk.23.ffn_down.weightI32[14336, 4096]
-
blk.23.ffn_gate.weightI32[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weightI32[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.24.attn_v.weightQ4_K[4096, 1024]
-
blk.24.ffn_down.weightI32[14336, 4096]
-
blk.24.ffn_gate.weightI32[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weightI32[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.25.attn_v.weightQ4_K[4096, 1024]
-
blk.25.ffn_down.weightI32[14336, 4096]
-
blk.25.ffn_gate.weightI32[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weightI32[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.26.attn_v.weightQ4_K[4096, 1024]
-
blk.26.ffn_down.weightI32[14336, 4096]
-
blk.26.ffn_gate.weightI32[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weightI32[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.27.attn_v.weightQ4_K[4096, 1024]
-
blk.27.ffn_down.weightI32[14336, 4096]
-
blk.27.ffn_gate.weightI32[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weightI32[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.28.attn_v.weightQ4_K[4096, 1024]
-
blk.28.ffn_down.weightI32[14336, 4096]
-
blk.28.ffn_gate.weightI32[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weightI32[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.29.attn_v.weightQ4_K[4096, 1024]
-
blk.29.ffn_down.weightI32[14336, 4096]
-
blk.29.ffn_gate.weightI32[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weightI32[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.30.attn_v.weightQ4_K[4096, 1024]
-
blk.30.ffn_down.weightI32[14336, 4096]
-
blk.30.ffn_gate.weightI32[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weightI32[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.31.attn_v.weightQ4_K[4096, 1024]
-
blk.31.ffn_down.weightI32[14336, 4096]
-
blk.31.ffn_gate.weightI32[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weightI32[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.32.attn_v.weightQ4_K[4096, 1024]
-
blk.32.ffn_down.weightI32[14336, 4096]
-
blk.32.ffn_gate.weightI32[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weightI32[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.33.attn_v.weightQ4_K[4096, 1024]
-
blk.33.ffn_down.weightI32[14336, 4096]
-
blk.33.ffn_gate.weightI32[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weightI32[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.34.attn_v.weightQ4_K[4096, 1024]
-
blk.34.ffn_down.weightI32[14336, 4096]
-
blk.34.ffn_gate.weightI32[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weightI32[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.35.attn_v.weightQ4_K[4096, 1024]
-
blk.35.ffn_down.weightI32[14336, 4096]
-
blk.35.ffn_gate.weightI32[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weightI32[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.36.attn_v.weightQ4_K[4096, 1024]
-
blk.36.ffn_down.weightI32[14336, 4096]
-
blk.36.ffn_gate.weightI32[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weightI32[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.37.attn_v.weightQ4_K[4096, 1024]
-
blk.37.ffn_down.weightI32[14336, 4096]
-
blk.37.ffn_gate.weightI32[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weightI32[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.38.attn_v.weightQ4_K[4096, 1024]
-
blk.38.ffn_down.weightI32[14336, 4096]
-
blk.38.ffn_gate.weightI32[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weightI32[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.39.attn_v.weightQ4_K[4096, 1024]
-
blk.39.ffn_down.weightI32[14336, 4096]
-
blk.39.ffn_gate.weightI32[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weightI32[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.40.attn_v.weightQ4_K[4096, 1024]
-
blk.40.ffn_down.weightI32[14336, 4096]
-
blk.40.ffn_gate.weightI32[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weightI32[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.41.attn_v.weightQ4_K[4096, 1024]
-
blk.41.ffn_down.weightI32[14336, 4096]
-
blk.41.ffn_gate.weightI32[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weightI32[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.42.attn_v.weightQ4_K[4096, 1024]
-
blk.42.ffn_down.weightI32[14336, 4096]
-
blk.42.ffn_gate.weightI32[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weightI32[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.43.attn_v.weightQ4_K[4096, 1024]
-
blk.43.ffn_down.weightI32[14336, 4096]
-
blk.43.ffn_gate.weightI32[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weightI32[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.44.attn_v.weightQ4_K[4096, 1024]
-
blk.44.ffn_down.weightI32[14336, 4096]
-
blk.44.ffn_gate.weightI32[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weightI32[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.45.attn_v.weightQ4_K[4096, 1024]
-
blk.45.ffn_down.weightI32[14336, 4096]
-
blk.45.ffn_gate.weightI32[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weightI32[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.46.attn_v.weightQ4_K[4096, 1024]
-
blk.46.ffn_down.weightI32[14336, 4096]
-
blk.46.ffn_gate.weightI32[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weightI32[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.47.attn_v.weightQ4_K[4096, 1024]
-
blk.47.ffn_down.weightI32[14336, 4096]
-
blk.47.ffn_gate.weightI32[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weightI32[4096, 14336]
-
blk.48.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.48.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.48.attn_v.weightQ4_K[4096, 1024]
-
blk.48.ffn_down.weightI32[14336, 4096]
-
blk.48.ffn_gate.weightI32[4096, 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.ffn_up.weightI32[4096, 14336]
-
blk.49.attn_k.weight(!unknown_type 22!)[4096, 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_output.weight(!unknown_type 21!)[4096, 4096]
-
blk.49.attn_q.weight(!unknown_type 22!)[4096, 4096]
-
blk.49.attn_v.weightQ4_K[4096, 1024]
-
blk.49.ffn_down.weightI32[14336, 4096]
-
blk.49.ffn_gate.weightI32[4096, 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.ffn_up.weightI32[4096, 14336]
-
output.weightQ5_K[4096, 32128]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49