90 Pulls Updated 3 weeks ago
eb114bf96e58 · 2.7GB
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
general.architecturellama
-
general.file_typeBF16
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length32768
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32001
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ2_K[4096 32128]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ2_K[14336 4096]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.0.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.0.attn_output.weightI8[4096 4096]
-
blk.0.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.0.attn_v.weightQ4_K[4096 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ2_K[14336 4096]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.1.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.1.attn_output.weightI8[4096 4096]
-
blk.1.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.1.attn_v.weightQ4_K[4096 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ2_K[14336 4096]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.2.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.2.attn_output.weightI8[4096 4096]
-
blk.2.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.2.attn_v.weightQ4_K[4096 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ2_K[14336 4096]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.3.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.3.attn_output.weightI8[4096 4096]
-
blk.3.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.3.attn_v.weightQ4_K[4096 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ2_K[14336 4096]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.4.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.4.attn_output.weightI8[4096 4096]
-
blk.4.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.4.attn_v.weightQ4_K[4096 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ2_K[14336 4096]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.5.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.5.attn_output.weightI8[4096 4096]
-
blk.5.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.5.attn_v.weightQ4_K[4096 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.6.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.6.attn_output.weightI8[4096 4096]
-
blk.6.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.6.attn_v.weightQ4_K[4096 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.7.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.7.attn_output.weightI8[4096 4096]
-
blk.7.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.7.attn_v.weightQ4_K[4096 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.8.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.8.attn_output.weightI8[4096 4096]
-
blk.8.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.8.attn_v.weightQ4_K[4096 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.9.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.9.attn_output.weightI8[4096 4096]
-
blk.9.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.9.attn_v.weightQ4_K[4096 1024]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.10.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.10.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.10.attn_output.weightI8[4096 4096]
-
blk.10.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.10.attn_v.weightQ4_K[4096 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.11.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.11.attn_output.weightI8[4096 4096]
-
blk.11.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.11.attn_v.weightQ4_K[4096 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.12.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.12.attn_output.weightI8[4096 4096]
-
blk.12.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.12.attn_v.weightQ4_K[4096 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.13.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.13.attn_output.weightI8[4096 4096]
-
blk.13.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.13.attn_v.weightQ4_K[4096 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.14.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.14.attn_output.weightI8[4096 4096]
-
blk.14.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.14.attn_v.weightQ4_K[4096 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.15.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.15.attn_output.weightI8[4096 4096]
-
blk.15.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.15.attn_v.weightQ4_K[4096 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.16.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.16.attn_output.weightI8[4096 4096]
-
blk.16.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.16.attn_v.weightQ4_K[4096 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.17.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.17.attn_output.weightI8[4096 4096]
-
blk.17.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.17.attn_v.weightQ4_K[4096 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.18.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.18.attn_output.weightI8[4096 4096]
-
blk.18.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.18.attn_v.weightQ4_K[4096 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.19.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.19.attn_output.weightI8[4096 4096]
-
blk.19.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.19.attn_v.weightQ4_K[4096 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.20.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.20.attn_output.weightI8[4096 4096]
-
blk.20.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.20.attn_v.weightQ4_K[4096 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.21.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.21.attn_output.weightI8[4096 4096]
-
blk.21.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.21.attn_v.weightQ4_K[4096 1024]
-
blk.22.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.22.attn_output.weightI8[4096 4096]
-
blk.22.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.22.attn_v.weightQ4_K[4096 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.22.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.23.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.23.attn_output.weightI8[4096 4096]
-
blk.23.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.23.attn_v.weightQ4_K[4096 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.24.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.24.attn_output.weightI8[4096 4096]
-
blk.24.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.24.attn_v.weightQ4_K[4096 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.25.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.25.attn_output.weightI8[4096 4096]
-
blk.25.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.25.attn_v.weightQ4_K[4096 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.26.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.26.attn_output.weightI8[4096 4096]
-
blk.26.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.26.attn_v.weightQ4_K[4096 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.27.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.27.attn_output.weightI8[4096 4096]
-
blk.27.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.27.attn_v.weightQ4_K[4096 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.28.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.28.attn_output.weightI8[4096 4096]
-
blk.28.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.28.attn_v.weightQ4_K[4096 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.29.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.29.attn_output.weightI8[4096 4096]
-
blk.29.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.29.attn_v.weightQ4_K[4096 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.30.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.30.attn_output.weightI8[4096 4096]
-
blk.30.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.30.attn_v.weightQ4_K[4096 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.31.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.31.attn_output.weightI8[4096 4096]
-
blk.31.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.31.attn_v.weightQ4_K[4096 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.32.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.32.attn_output.weightI8[4096 4096]
-
blk.32.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.32.attn_v.weightQ4_K[4096 1024]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.33.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.33.attn_output.weightI8[4096 4096]
-
blk.33.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.33.attn_v.weightQ4_K[4096 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.33.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.34.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.34.attn_output.weightI8[4096 4096]
-
blk.34.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.34.attn_v.weightQ4_K[4096 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.35.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.35.attn_output.weightI8[4096 4096]
-
blk.35.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.35.attn_v.weightQ4_K[4096 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.36.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.36.attn_output.weightI8[4096 4096]
-
blk.36.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.36.attn_v.weightQ4_K[4096 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.37.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.37.attn_output.weightI8[4096 4096]
-
blk.37.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.37.attn_v.weightQ4_K[4096 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.38.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.38.attn_output.weightI8[4096 4096]
-
blk.38.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.38.attn_v.weightQ4_K[4096 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.39.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.39.attn_output.weightI8[4096 4096]
-
blk.39.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.39.attn_v.weightQ4_K[4096 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.40.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.40.attn_output.weightI8[4096 4096]
-
blk.40.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.40.attn_v.weightQ4_K[4096 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.41.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.41.attn_output.weightI8[4096 4096]
-
blk.41.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.41.attn_v.weightQ4_K[4096 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.42.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.42.attn_output.weightI8[4096 4096]
-
blk.42.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.42.attn_v.weightQ4_K[4096 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.43.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.43.attn_output.weightI8[4096 4096]
-
blk.43.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.43.attn_v.weightQ4_K[4096 1024]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.44.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.44.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.44.attn_output.weightI8[4096 4096]
-
blk.44.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.44.attn_v.weightQ4_K[4096 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.45.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.45.attn_output.weightI8[4096 4096]
-
blk.45.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.45.attn_v.weightQ4_K[4096 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.46.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.46.attn_output.weightI8[4096 4096]
-
blk.46.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.46.attn_v.weightQ4_K[4096 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.47.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.47.attn_output.weightI8[4096 4096]
-
blk.47.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.47.attn_v.weightQ4_K[4096 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.48.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.48.attn_output.weightI8[4096 4096]
-
blk.48.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.48.attn_v.weightQ4_K[4096 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.ffn_down.weight(!unknown_type 29!)[14336 4096]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[4096 14336]
-
blk.49.ffn_up.weight(!unknown_type 29!)[4096 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.attn_k.weight(!unknown_type 29!)[4096 1024]
-
blk.49.attn_output.weightI8[4096 4096]
-
blk.49.attn_q.weight(!unknown_type 29!)[4096 4096]
-
blk.49.attn_v.weightQ4_K[4096 1024]
-
output.weightQ5_K[4096 32128]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49