With correct 16k context window
33B
73 Pulls Updated 3 months ago
5ef15ed56c4d · 5.5GB
-
general.architecturellama
-
general.file_typeQ6_K
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count32
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32014
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ6_K[4096 32256]
-
blk.0.attn_q.weightQ6_K[4096 4096]
-
blk.0.attn_k.weightQ6_K[4096 4096]
-
blk.0.attn_v.weightQ6_K[4096 4096]
-
blk.0.attn_output.weightQ6_K[4096 4096]
-
blk.0.ffn_gate.weightQ6_K[4096 11008]
-
blk.0.ffn_up.weightQ6_K[4096 11008]
-
blk.0.ffn_down.weightQ6_K[11008 4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.1.attn_q.weightQ6_K[4096 4096]
-
blk.1.attn_k.weightQ6_K[4096 4096]
-
blk.1.attn_v.weightQ6_K[4096 4096]
-
blk.1.attn_output.weightQ6_K[4096 4096]
-
blk.1.ffn_gate.weightQ6_K[4096 11008]
-
blk.1.ffn_up.weightQ6_K[4096 11008]
-
blk.1.ffn_down.weightQ6_K[11008 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.2.attn_q.weightQ6_K[4096 4096]
-
blk.2.attn_k.weightQ6_K[4096 4096]
-
blk.2.attn_v.weightQ6_K[4096 4096]
-
blk.2.attn_output.weightQ6_K[4096 4096]
-
blk.2.ffn_gate.weightQ6_K[4096 11008]
-
blk.2.ffn_up.weightQ6_K[4096 11008]
-
blk.2.ffn_down.weightQ6_K[11008 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.3.attn_q.weightQ6_K[4096 4096]
-
blk.3.attn_k.weightQ6_K[4096 4096]
-
blk.3.attn_v.weightQ6_K[4096 4096]
-
blk.3.attn_output.weightQ6_K[4096 4096]
-
blk.3.ffn_gate.weightQ6_K[4096 11008]
-
blk.3.ffn_up.weightQ6_K[4096 11008]
-
blk.3.ffn_down.weightQ6_K[11008 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.4.attn_q.weightQ6_K[4096 4096]
-
blk.4.attn_k.weightQ6_K[4096 4096]
-
blk.4.attn_v.weightQ6_K[4096 4096]
-
blk.4.attn_output.weightQ6_K[4096 4096]
-
blk.4.ffn_gate.weightQ6_K[4096 11008]
-
blk.4.ffn_up.weightQ6_K[4096 11008]
-
blk.4.ffn_down.weightQ6_K[11008 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.5.attn_q.weightQ6_K[4096 4096]
-
blk.5.attn_k.weightQ6_K[4096 4096]
-
blk.5.attn_v.weightQ6_K[4096 4096]
-
blk.5.attn_output.weightQ6_K[4096 4096]
-
blk.5.ffn_gate.weightQ6_K[4096 11008]
-
blk.5.ffn_up.weightQ6_K[4096 11008]
-
blk.5.ffn_down.weightQ6_K[11008 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.6.attn_q.weightQ6_K[4096 4096]
-
blk.6.attn_k.weightQ6_K[4096 4096]
-
blk.6.attn_v.weightQ6_K[4096 4096]
-
blk.6.attn_output.weightQ6_K[4096 4096]
-
blk.6.ffn_gate.weightQ6_K[4096 11008]
-
blk.6.ffn_up.weightQ6_K[4096 11008]
-
blk.6.ffn_down.weightQ6_K[11008 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.7.attn_q.weightQ6_K[4096 4096]
-
blk.7.attn_k.weightQ6_K[4096 4096]
-
blk.7.attn_v.weightQ6_K[4096 4096]
-
blk.7.attn_output.weightQ6_K[4096 4096]
-
blk.7.ffn_gate.weightQ6_K[4096 11008]
-
blk.7.ffn_up.weightQ6_K[4096 11008]
-
blk.7.ffn_down.weightQ6_K[11008 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.8.attn_q.weightQ6_K[4096 4096]
-
blk.8.attn_k.weightQ6_K[4096 4096]
-
blk.8.attn_v.weightQ6_K[4096 4096]
-
blk.8.attn_output.weightQ6_K[4096 4096]
-
blk.8.ffn_gate.weightQ6_K[4096 11008]
-
blk.8.ffn_up.weightQ6_K[4096 11008]
-
blk.8.ffn_down.weightQ6_K[11008 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.9.attn_q.weightQ6_K[4096 4096]
-
blk.9.attn_k.weightQ6_K[4096 4096]
-
blk.9.attn_v.weightQ6_K[4096 4096]
-
blk.9.attn_output.weightQ6_K[4096 4096]
-
blk.9.ffn_gate.weightQ6_K[4096 11008]
-
blk.9.ffn_up.weightQ6_K[4096 11008]
-
blk.9.ffn_down.weightQ6_K[11008 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.10.attn_q.weightQ6_K[4096 4096]
-
blk.10.attn_k.weightQ6_K[4096 4096]
-
blk.10.attn_v.weightQ6_K[4096 4096]
-
blk.10.attn_output.weightQ6_K[4096 4096]
-
blk.10.ffn_gate.weightQ6_K[4096 11008]
-
blk.10.ffn_up.weightQ6_K[4096 11008]
-
blk.10.ffn_down.weightQ6_K[11008 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.11.attn_q.weightQ6_K[4096 4096]
-
blk.11.attn_k.weightQ6_K[4096 4096]
-
blk.11.attn_v.weightQ6_K[4096 4096]
-
blk.11.attn_output.weightQ6_K[4096 4096]
-
blk.11.ffn_gate.weightQ6_K[4096 11008]
-
blk.11.ffn_up.weightQ6_K[4096 11008]
-
blk.11.ffn_down.weightQ6_K[11008 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_q.weightQ6_K[4096 4096]
-
blk.12.attn_k.weightQ6_K[4096 4096]
-
blk.12.attn_v.weightQ6_K[4096 4096]
-
blk.12.attn_output.weightQ6_K[4096 4096]
-
blk.12.ffn_gate.weightQ6_K[4096 11008]
-
blk.12.ffn_up.weightQ6_K[4096 11008]
-
blk.12.ffn_down.weightQ6_K[11008 4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_q.weightQ6_K[4096 4096]
-
blk.13.attn_k.weightQ6_K[4096 4096]
-
blk.13.attn_v.weightQ6_K[4096 4096]
-
blk.13.attn_output.weightQ6_K[4096 4096]
-
blk.13.ffn_gate.weightQ6_K[4096 11008]
-
blk.13.ffn_up.weightQ6_K[4096 11008]
-
blk.13.ffn_down.weightQ6_K[11008 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.14.attn_q.weightQ6_K[4096 4096]
-
blk.14.attn_k.weightQ6_K[4096 4096]
-
blk.14.attn_v.weightQ6_K[4096 4096]
-
blk.14.attn_output.weightQ6_K[4096 4096]
-
blk.14.ffn_gate.weightQ6_K[4096 11008]
-
blk.14.ffn_up.weightQ6_K[4096 11008]
-
blk.14.ffn_down.weightQ6_K[11008 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.15.attn_q.weightQ6_K[4096 4096]
-
blk.15.attn_k.weightQ6_K[4096 4096]
-
blk.15.attn_v.weightQ6_K[4096 4096]
-
blk.15.attn_output.weightQ6_K[4096 4096]
-
blk.15.ffn_gate.weightQ6_K[4096 11008]
-
blk.15.ffn_up.weightQ6_K[4096 11008]
-
blk.15.ffn_down.weightQ6_K[11008 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.16.attn_q.weightQ6_K[4096 4096]
-
blk.16.attn_k.weightQ6_K[4096 4096]
-
blk.16.attn_v.weightQ6_K[4096 4096]
-
blk.16.attn_output.weightQ6_K[4096 4096]
-
blk.16.ffn_gate.weightQ6_K[4096 11008]
-
blk.16.ffn_up.weightQ6_K[4096 11008]
-
blk.16.ffn_down.weightQ6_K[11008 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.17.attn_q.weightQ6_K[4096 4096]
-
blk.17.attn_k.weightQ6_K[4096 4096]
-
blk.17.attn_v.weightQ6_K[4096 4096]
-
blk.17.attn_output.weightQ6_K[4096 4096]
-
blk.17.ffn_gate.weightQ6_K[4096 11008]
-
blk.17.ffn_up.weightQ6_K[4096 11008]
-
blk.17.ffn_down.weightQ6_K[11008 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.18.attn_q.weightQ6_K[4096 4096]
-
blk.18.attn_k.weightQ6_K[4096 4096]
-
blk.18.attn_v.weightQ6_K[4096 4096]
-
blk.18.attn_output.weightQ6_K[4096 4096]
-
blk.18.ffn_gate.weightQ6_K[4096 11008]
-
blk.18.ffn_up.weightQ6_K[4096 11008]
-
blk.18.ffn_down.weightQ6_K[11008 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.19.attn_q.weightQ6_K[4096 4096]
-
blk.19.attn_k.weightQ6_K[4096 4096]
-
blk.19.attn_v.weightQ6_K[4096 4096]
-
blk.19.attn_output.weightQ6_K[4096 4096]
-
blk.19.ffn_gate.weightQ6_K[4096 11008]
-
blk.19.ffn_up.weightQ6_K[4096 11008]
-
blk.19.ffn_down.weightQ6_K[11008 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.20.attn_q.weightQ6_K[4096 4096]
-
blk.20.attn_k.weightQ6_K[4096 4096]
-
blk.20.attn_v.weightQ6_K[4096 4096]
-
blk.20.attn_output.weightQ6_K[4096 4096]
-
blk.20.ffn_gate.weightQ6_K[4096 11008]
-
blk.20.ffn_up.weightQ6_K[4096 11008]
-
blk.20.ffn_down.weightQ6_K[11008 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.21.attn_q.weightQ6_K[4096 4096]
-
blk.21.attn_k.weightQ6_K[4096 4096]
-
blk.21.attn_v.weightQ6_K[4096 4096]
-
blk.21.attn_output.weightQ6_K[4096 4096]
-
blk.21.ffn_gate.weightQ6_K[4096 11008]
-
blk.21.ffn_up.weightQ6_K[4096 11008]
-
blk.21.ffn_down.weightQ6_K[11008 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.22.attn_q.weightQ6_K[4096 4096]
-
blk.22.attn_k.weightQ6_K[4096 4096]
-
blk.22.attn_v.weightQ6_K[4096 4096]
-
blk.22.attn_output.weightQ6_K[4096 4096]
-
blk.22.ffn_gate.weightQ6_K[4096 11008]
-
blk.22.ffn_up.weightQ6_K[4096 11008]
-
blk.22.ffn_down.weightQ6_K[11008 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.23.attn_q.weightQ6_K[4096 4096]
-
blk.23.attn_k.weightQ6_K[4096 4096]
-
blk.23.attn_v.weightQ6_K[4096 4096]
-
blk.23.attn_output.weightQ6_K[4096 4096]
-
blk.23.ffn_gate.weightQ6_K[4096 11008]
-
blk.23.ffn_up.weightQ6_K[4096 11008]
-
blk.23.ffn_down.weightQ6_K[11008 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_q.weightQ6_K[4096 4096]
-
blk.24.attn_k.weightQ6_K[4096 4096]
-
blk.24.attn_v.weightQ6_K[4096 4096]
-
blk.24.attn_output.weightQ6_K[4096 4096]
-
blk.24.ffn_gate.weightQ6_K[4096 11008]
-
blk.24.ffn_up.weightQ6_K[4096 11008]
-
blk.24.ffn_down.weightQ6_K[11008 4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.25.attn_q.weightQ6_K[4096 4096]
-
blk.25.attn_k.weightQ6_K[4096 4096]
-
blk.25.attn_v.weightQ6_K[4096 4096]
-
blk.25.attn_output.weightQ6_K[4096 4096]
-
blk.25.ffn_gate.weightQ6_K[4096 11008]
-
blk.25.ffn_up.weightQ6_K[4096 11008]
-
blk.25.ffn_down.weightQ6_K[11008 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.26.attn_q.weightQ6_K[4096 4096]
-
blk.26.attn_k.weightQ6_K[4096 4096]
-
blk.26.attn_v.weightQ6_K[4096 4096]
-
blk.26.attn_output.weightQ6_K[4096 4096]
-
blk.26.ffn_gate.weightQ6_K[4096 11008]
-
blk.26.ffn_up.weightQ6_K[4096 11008]
-
blk.26.ffn_down.weightQ6_K[11008 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.27.attn_q.weightQ6_K[4096 4096]
-
blk.27.attn_k.weightQ6_K[4096 4096]
-
blk.27.attn_v.weightQ6_K[4096 4096]
-
blk.27.attn_output.weightQ6_K[4096 4096]
-
blk.27.ffn_gate.weightQ6_K[4096 11008]
-
blk.27.ffn_up.weightQ6_K[4096 11008]
-
blk.27.ffn_down.weightQ6_K[11008 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.28.attn_q.weightQ6_K[4096 4096]
-
blk.28.attn_k.weightQ6_K[4096 4096]
-
blk.28.attn_v.weightQ6_K[4096 4096]
-
blk.28.attn_output.weightQ6_K[4096 4096]
-
blk.28.ffn_gate.weightQ6_K[4096 11008]
-
blk.28.ffn_up.weightQ6_K[4096 11008]
-
blk.28.ffn_down.weightQ6_K[11008 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.29.attn_q.weightQ6_K[4096 4096]
-
blk.29.attn_k.weightQ6_K[4096 4096]
-
blk.29.attn_v.weightQ6_K[4096 4096]
-
blk.29.attn_output.weightQ6_K[4096 4096]
-
blk.29.ffn_gate.weightQ6_K[4096 11008]
-
blk.29.ffn_up.weightQ6_K[4096 11008]
-
blk.29.ffn_down.weightQ6_K[11008 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.30.attn_q.weightQ6_K[4096 4096]
-
blk.30.attn_k.weightQ6_K[4096 4096]
-
blk.30.attn_v.weightQ6_K[4096 4096]
-
blk.30.attn_output.weightQ6_K[4096 4096]
-
blk.30.ffn_gate.weightQ6_K[4096 11008]
-
blk.30.ffn_up.weightQ6_K[4096 11008]
-
blk.30.ffn_down.weightQ6_K[11008 4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.31.attn_q.weightQ6_K[4096 4096]
-
blk.31.attn_k.weightQ6_K[4096 4096]
-
blk.31.attn_v.weightQ6_K[4096 4096]
-
blk.31.attn_output.weightQ6_K[4096 4096]
-
blk.31.ffn_gate.weightQ6_K[4096 11008]
-
blk.31.ffn_up.weightQ6_K[4096 11008]
-
blk.31.ffn_down.weightQ6_K[11008 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_norm.weightF32[4096]
-
output_norm.weightF32[4096]
-
output.weightQ6_K[4096 32256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31