Polish LLM - Bielik-11B-v2.3-Instruct ~ by SpeakLeash a.k.a Spichlerz!
46 Pulls Updated 2 weeks ago
6c1703072cc5 · 2.7GB
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
general.architecturellama
-
general.file_typeBF16
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length32768
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32001
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ2_K[4096 32128]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ2_K[14336 4096]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.0.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.0.attn_output.weightI8[4096 4096]
-
blk.0.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.0.attn_v.weightQ4_K[4096 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ2_K[14336 4096]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.1.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.1.attn_output.weightI8[4096 4096]
-
blk.1.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.1.attn_v.weightQ4_K[4096 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.2.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.2.attn_output.weightI8[4096 4096]
-
blk.2.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.2.attn_v.weightQ4_K[4096 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.3.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.3.attn_output.weightI8[4096 4096]
-
blk.3.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.3.attn_v.weightQ4_K[4096 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.4.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.4.attn_output.weightI8[4096 4096]
-
blk.4.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.4.attn_v.weightQ4_K[4096 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.5.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.5.attn_output.weightI8[4096 4096]
-
blk.5.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.5.attn_v.weightQ4_K[4096 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.6.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.6.attn_output.weightI8[4096 4096]
-
blk.6.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.6.attn_v.weightQ4_K[4096 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.7.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.7.attn_output.weightI8[4096 4096]
-
blk.7.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.7.attn_v.weightQ4_K[4096 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.8.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.8.attn_output.weightI8[4096 4096]
-
blk.8.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.8.attn_v.weightQ4_K[4096 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.9.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.9.attn_output.weightI8[4096 4096]
-
blk.9.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.9.attn_v.weightQ4_K[4096 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ2_K[14336 4096]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.10.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.10.attn_output.weightI8[4096 4096]
-
blk.10.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.10.attn_v.weightQ4_K[4096 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ2_K[14336 4096]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.11.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.11.attn_output.weightI8[4096 4096]
-
blk.11.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.11.attn_v.weightQ4_K[4096 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ2_K[14336 4096]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.12.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.12.attn_output.weightI8[4096 4096]
-
blk.12.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.12.attn_v.weightQ4_K[4096 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ2_K[14336 4096]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.13.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.13.attn_output.weightI8[4096 4096]
-
blk.13.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.13.attn_v.weightQ4_K[4096 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.14.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.14.attn_output.weightI8[4096 4096]
-
blk.14.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.14.attn_v.weightQ4_K[4096 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.15.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.15.attn_output.weightI8[4096 4096]
-
blk.15.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.15.attn_v.weightQ4_K[4096 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.16.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.16.attn_output.weightI8[4096 4096]
-
blk.16.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.16.attn_v.weightQ4_K[4096 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.17.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.17.attn_output.weightI8[4096 4096]
-
blk.17.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.17.attn_v.weightQ4_K[4096 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.18.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.18.attn_output.weightI8[4096 4096]
-
blk.18.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.18.attn_v.weightQ4_K[4096 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.19.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.19.attn_output.weightI8[4096 4096]
-
blk.19.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.19.attn_v.weightQ4_K[4096 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.20.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.20.attn_output.weightI8[4096 4096]
-
blk.20.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.20.attn_v.weightQ4_K[4096 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.21.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.21.attn_output.weightI8[4096 4096]
-
blk.21.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.21.attn_v.weightQ4_K[4096 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.22.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.22.attn_output.weightI8[4096 4096]
-
blk.22.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.22.attn_v.weightQ4_K[4096 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.23.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.23.attn_output.weightI8[4096 4096]
-
blk.23.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.23.attn_v.weightQ4_K[4096 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.24.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.24.attn_output.weightI8[4096 4096]
-
blk.24.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.24.attn_v.weightQ4_K[4096 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.25.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.25.attn_output.weightI8[4096 4096]
-
blk.25.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.25.attn_v.weightQ4_K[4096 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.26.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.26.attn_output.weightI8[4096 4096]
-
blk.26.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.26.attn_v.weightQ4_K[4096 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.27.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.27.attn_output.weightI8[4096 4096]
-
blk.27.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.27.attn_v.weightQ4_K[4096 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.28.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.28.attn_output.weightI8[4096 4096]
-
blk.28.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.28.attn_v.weightQ4_K[4096 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.29.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.29.attn_output.weightI8[4096 4096]
-
blk.29.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.29.attn_v.weightQ4_K[4096 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.30.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.30.attn_output.weightI8[4096 4096]
-
blk.30.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.30.attn_v.weightQ4_K[4096 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.31.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.31.attn_output.weightI8[4096 4096]
-
blk.31.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.31.attn_v.weightQ4_K[4096 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.32.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.32.attn_output.weightI8[4096 4096]
-
blk.32.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.32.attn_v.weightQ4_K[4096 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.33.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.33.attn_output.weightI8[4096 4096]
-
blk.33.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.33.attn_v.weightQ4_K[4096 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.34.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.34.attn_output.weightI8[4096 4096]
-
blk.34.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.34.attn_v.weightQ4_K[4096 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.35.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.35.attn_output.weightI8[4096 4096]
-
blk.35.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.35.attn_v.weightQ4_K[4096 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.36.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.36.attn_output.weightI8[4096 4096]
-
blk.36.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.36.attn_v.weightQ4_K[4096 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.37.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.37.attn_output.weightI8[4096 4096]
-
blk.37.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.37.attn_v.weightQ4_K[4096 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.38.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.38.attn_output.weightI8[4096 4096]
-
blk.38.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.38.attn_v.weightQ4_K[4096 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.39.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.39.attn_output.weightI8[4096 4096]
-
blk.39.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.39.attn_v.weightQ4_K[4096 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.40.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.40.attn_output.weightI8[4096 4096]
-
blk.40.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.40.attn_v.weightQ4_K[4096 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.41.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.41.attn_output.weightI8[4096 4096]
-
blk.41.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.41.attn_v.weightQ4_K[4096 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.42.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.42.attn_output.weightI8[4096 4096]
-
blk.42.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.42.attn_v.weightQ4_K[4096 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.43.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.43.attn_output.weightI8[4096 4096]
-
blk.43.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.43.attn_v.weightQ4_K[4096 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.44.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.44.attn_output.weightI8[4096 4096]
-
blk.44.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.44.attn_v.weightQ4_K[4096 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.45.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.45.attn_output.weightI8[4096 4096]
-
blk.45.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.45.attn_v.weightQ4_K[4096 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.46.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.46.attn_output.weightI8[4096 4096]
-
blk.46.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.46.attn_v.weightQ4_K[4096 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.47.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.47.attn_output.weightI8[4096 4096]
-
blk.47.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.47.attn_v.weightQ4_K[4096 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.48.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.48.attn_output.weightI8[4096 4096]
-
blk.48.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.48.attn_v.weightQ4_K[4096 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.49.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.49.attn_output.weightI8[4096 4096]
-
blk.49.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.49.attn_v.weightQ4_K[4096 1024]
-
output.weightQ5_K[4096 32128]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49