2 Pulls Updated 9 days ago
f9ec0da8505d · 4.3GB
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
general.architecturellama
-
general.file_typeIQ3_XXS
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length32768
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32001
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[4096 32128]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightI32[14336 4096]
-
blk.0.ffn_gate.weightI32[4096 14336]
-
blk.0.ffn_up.weightI32[4096 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.0.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.0.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.0.attn_v.weightQ4_K[4096 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightI32[14336 4096]
-
blk.1.ffn_gate.weightI32[4096 14336]
-
blk.1.ffn_up.weightI32[4096 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.1.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.1.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.1.attn_v.weightQ4_K[4096 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightI32[14336 4096]
-
blk.2.ffn_gate.weightI32[4096 14336]
-
blk.2.ffn_up.weightI32[4096 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.2.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.2.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.2.attn_v.weightQ4_K[4096 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightI32[14336 4096]
-
blk.3.ffn_gate.weightI32[4096 14336]
-
blk.3.ffn_up.weightI32[4096 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.3.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.3.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.3.attn_v.weightQ4_K[4096 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightI32[14336 4096]
-
blk.4.ffn_gate.weightI32[4096 14336]
-
blk.4.ffn_up.weightI32[4096 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.4.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.4.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.4.attn_v.weightQ4_K[4096 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightI32[14336 4096]
-
blk.5.ffn_gate.weightI32[4096 14336]
-
blk.5.ffn_up.weightI32[4096 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.5.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.5.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.5.attn_v.weightQ4_K[4096 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightI32[14336 4096]
-
blk.6.ffn_gate.weightI32[4096 14336]
-
blk.6.ffn_up.weightI32[4096 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.6.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.6.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.6.attn_v.weightQ4_K[4096 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightI32[14336 4096]
-
blk.7.ffn_gate.weightI32[4096 14336]
-
blk.7.ffn_up.weightI32[4096 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.7.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.7.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.7.attn_v.weightQ4_K[4096 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightI32[14336 4096]
-
blk.8.ffn_gate.weightI32[4096 14336]
-
blk.8.ffn_up.weightI32[4096 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.8.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.8.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.8.attn_v.weightQ4_K[4096 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightI32[14336 4096]
-
blk.9.ffn_gate.weightI32[4096 14336]
-
blk.9.ffn_up.weightI32[4096 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.9.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.9.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.9.attn_v.weightQ4_K[4096 1024]
-
blk.10.ffn_gate.weightI32[4096 14336]
-
blk.10.ffn_up.weightI32[4096 14336]
-
blk.10.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.10.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.10.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.10.attn_v.weightQ4_K[4096 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightI32[14336 4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightI32[14336 4096]
-
blk.11.ffn_gate.weightI32[4096 14336]
-
blk.11.ffn_up.weightI32[4096 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.11.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.11.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.11.attn_v.weightQ4_K[4096 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightI32[14336 4096]
-
blk.12.ffn_gate.weightI32[4096 14336]
-
blk.12.ffn_up.weightI32[4096 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.12.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.12.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.12.attn_v.weightQ4_K[4096 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightI32[14336 4096]
-
blk.13.ffn_gate.weightI32[4096 14336]
-
blk.13.ffn_up.weightI32[4096 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.13.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.13.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.13.attn_v.weightQ4_K[4096 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightI32[14336 4096]
-
blk.14.ffn_gate.weightI32[4096 14336]
-
blk.14.ffn_up.weightI32[4096 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.14.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.14.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.14.attn_v.weightQ4_K[4096 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightI32[14336 4096]
-
blk.15.ffn_gate.weightI32[4096 14336]
-
blk.15.ffn_up.weightI32[4096 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.15.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.15.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.15.attn_v.weightQ4_K[4096 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightI32[14336 4096]
-
blk.16.ffn_gate.weightI32[4096 14336]
-
blk.16.ffn_up.weightI32[4096 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.16.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.16.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.16.attn_v.weightQ4_K[4096 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightI32[14336 4096]
-
blk.17.ffn_gate.weightI32[4096 14336]
-
blk.17.ffn_up.weightI32[4096 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.17.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.17.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.17.attn_v.weightQ4_K[4096 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightI32[14336 4096]
-
blk.18.ffn_gate.weightI32[4096 14336]
-
blk.18.ffn_up.weightI32[4096 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.18.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.18.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.18.attn_v.weightQ4_K[4096 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightI32[14336 4096]
-
blk.19.ffn_gate.weightI32[4096 14336]
-
blk.19.ffn_up.weightI32[4096 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.19.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.19.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.19.attn_v.weightQ4_K[4096 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightI32[14336 4096]
-
blk.20.ffn_gate.weightI32[4096 14336]
-
blk.20.ffn_up.weightI32[4096 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.20.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.20.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.20.attn_v.weightQ4_K[4096 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightI32[14336 4096]
-
blk.21.ffn_gate.weightI32[4096 14336]
-
blk.21.ffn_up.weightI32[4096 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.21.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.21.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.21.attn_v.weightQ4_K[4096 1024]
-
blk.22.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.22.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.22.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.22.attn_v.weightQ4_K[4096 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightI32[14336 4096]
-
blk.22.ffn_gate.weightI32[4096 14336]
-
blk.22.ffn_up.weightI32[4096 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightI32[14336 4096]
-
blk.23.ffn_gate.weightI32[4096 14336]
-
blk.23.ffn_up.weightI32[4096 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.23.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.23.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.23.attn_v.weightQ4_K[4096 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightI32[14336 4096]
-
blk.24.ffn_gate.weightI32[4096 14336]
-
blk.24.ffn_up.weightI32[4096 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.24.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.24.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.24.attn_v.weightQ4_K[4096 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightI32[14336 4096]
-
blk.25.ffn_gate.weightI32[4096 14336]
-
blk.25.ffn_up.weightI32[4096 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.25.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.25.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.25.attn_v.weightQ4_K[4096 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightI32[14336 4096]
-
blk.26.ffn_gate.weightI32[4096 14336]
-
blk.26.ffn_up.weightI32[4096 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.26.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.26.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.26.attn_v.weightQ4_K[4096 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightI32[14336 4096]
-
blk.27.ffn_gate.weightI32[4096 14336]
-
blk.27.ffn_up.weightI32[4096 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.27.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.27.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.27.attn_v.weightQ4_K[4096 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightI32[14336 4096]
-
blk.28.ffn_gate.weightI32[4096 14336]
-
blk.28.ffn_up.weightI32[4096 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.28.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.28.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.28.attn_v.weightQ4_K[4096 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightI32[14336 4096]
-
blk.29.ffn_gate.weightI32[4096 14336]
-
blk.29.ffn_up.weightI32[4096 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.29.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.29.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.29.attn_v.weightQ4_K[4096 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightI32[14336 4096]
-
blk.30.ffn_gate.weightI32[4096 14336]
-
blk.30.ffn_up.weightI32[4096 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.30.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.30.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.30.attn_v.weightQ4_K[4096 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightI32[14336 4096]
-
blk.31.ffn_gate.weightI32[4096 14336]
-
blk.31.ffn_up.weightI32[4096 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.31.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.31.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.31.attn_v.weightQ4_K[4096 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.ffn_down.weightI32[14336 4096]
-
blk.32.ffn_gate.weightI32[4096 14336]
-
blk.32.ffn_up.weightI32[4096 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.32.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.32.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.32.attn_v.weightQ4_K[4096 1024]
-
blk.33.ffn_gate.weightI32[4096 14336]
-
blk.33.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.33.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.33.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.33.attn_v.weightQ4_K[4096 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.ffn_down.weightI32[14336 4096]
-
blk.33.ffn_up.weightI32[4096 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.ffn_down.weightI32[14336 4096]
-
blk.34.ffn_gate.weightI32[4096 14336]
-
blk.34.ffn_up.weightI32[4096 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.34.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.34.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.34.attn_v.weightQ4_K[4096 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.ffn_down.weightI32[14336 4096]
-
blk.35.ffn_gate.weightI32[4096 14336]
-
blk.35.ffn_up.weightI32[4096 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.35.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.35.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.35.attn_v.weightQ4_K[4096 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.ffn_down.weightI32[14336 4096]
-
blk.36.ffn_gate.weightI32[4096 14336]
-
blk.36.ffn_up.weightI32[4096 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.36.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.36.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.36.attn_v.weightQ4_K[4096 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.ffn_down.weightI32[14336 4096]
-
blk.37.ffn_gate.weightI32[4096 14336]
-
blk.37.ffn_up.weightI32[4096 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.37.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.37.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.37.attn_v.weightQ4_K[4096 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.ffn_down.weightI32[14336 4096]
-
blk.38.ffn_gate.weightI32[4096 14336]
-
blk.38.ffn_up.weightI32[4096 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.38.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.38.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.38.attn_v.weightQ4_K[4096 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.ffn_down.weightI32[14336 4096]
-
blk.39.ffn_gate.weightI32[4096 14336]
-
blk.39.ffn_up.weightI32[4096 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.39.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.39.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.39.attn_v.weightQ4_K[4096 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.ffn_down.weightI32[14336 4096]
-
blk.40.ffn_gate.weightI32[4096 14336]
-
blk.40.ffn_up.weightI32[4096 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.40.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.40.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.40.attn_v.weightQ4_K[4096 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.ffn_down.weightI32[14336 4096]
-
blk.41.ffn_gate.weightI32[4096 14336]
-
blk.41.ffn_up.weightI32[4096 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.41.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.41.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.41.attn_v.weightQ4_K[4096 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.ffn_down.weightI32[14336 4096]
-
blk.42.ffn_gate.weightI32[4096 14336]
-
blk.42.ffn_up.weightI32[4096 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.42.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.42.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.42.attn_v.weightQ4_K[4096 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.ffn_down.weightI32[14336 4096]
-
blk.43.ffn_gate.weightI32[4096 14336]
-
blk.43.ffn_up.weightI32[4096 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.43.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.43.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.43.attn_v.weightQ4_K[4096 1024]
-
blk.44.ffn_gate.weightI32[4096 14336]
-
blk.44.ffn_up.weightI32[4096 14336]
-
blk.44.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.44.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.44.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.44.attn_v.weightQ4_K[4096 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.ffn_down.weightI32[14336 4096]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.ffn_down.weightI32[14336 4096]
-
blk.45.ffn_gate.weightI32[4096 14336]
-
blk.45.ffn_up.weightI32[4096 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.45.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.45.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.45.attn_v.weightQ4_K[4096 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.ffn_down.weightI32[14336 4096]
-
blk.46.ffn_gate.weightI32[4096 14336]
-
blk.46.ffn_up.weightI32[4096 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.46.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.46.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.46.attn_v.weightQ4_K[4096 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.ffn_down.weightI32[14336 4096]
-
blk.47.ffn_gate.weightI32[4096 14336]
-
blk.47.ffn_up.weightI32[4096 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.47.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.47.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.47.attn_v.weightQ4_K[4096 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.ffn_down.weightI32[14336 4096]
-
blk.48.ffn_gate.weightI32[4096 14336]
-
blk.48.ffn_up.weightI32[4096 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.48.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.48.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.48.attn_v.weightQ4_K[4096 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.ffn_down.weightI32[14336 4096]
-
blk.49.ffn_gate.weightI32[4096 14336]
-
blk.49.ffn_up.weightI32[4096 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.attn_k.weight(!unknown_type 22!)[4096 1024]
-
blk.49.attn_output.weight(!unknown_type 21!)[4096 4096]
-
blk.49.attn_q.weight(!unknown_type 22!)[4096 4096]
-
blk.49.attn_v.weightQ4_K[4096 1024]
-
output.weightQ5_K[4096 32128]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49