latest
3.7GB
trendyol-llm-7b-chat-v0.1.Q3_K_L.gguf
7B
3 Pulls Updated 2 months ago
c7d607d5eeca · 3.7GB
-
general.architecturellama
-
general.file_typeQ3_K_L
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count32
-
llama.context_length4096
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
NameTypeShape
-
token_embd.weightQ3_K[4096 44222]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ5_K[11008 4096]
-
blk.0.ffn_gate.weightQ3_K[4096 11008]
-
blk.0.ffn_up.weightQ3_K[4096 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weightQ3_K[4096 4096]
-
blk.0.attn_output.weightQ5_K[4096 4096]
-
blk.0.attn_q.weightQ3_K[4096 4096]
-
blk.0.attn_v.weightQ5_K[4096 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ5_K[11008 4096]
-
blk.1.ffn_gate.weightQ3_K[4096 11008]
-
blk.1.ffn_up.weightQ3_K[4096 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weightQ3_K[4096 4096]
-
blk.1.attn_output.weightQ5_K[4096 4096]
-
blk.1.attn_q.weightQ3_K[4096 4096]
-
blk.1.attn_v.weightQ5_K[4096 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ5_K[11008 4096]
-
blk.2.ffn_gate.weightQ3_K[4096 11008]
-
blk.2.ffn_up.weightQ3_K[4096 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weightQ3_K[4096 4096]
-
blk.2.attn_output.weightQ5_K[4096 4096]
-
blk.2.attn_q.weightQ3_K[4096 4096]
-
blk.2.attn_v.weightQ5_K[4096 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ5_K[11008 4096]
-
blk.3.ffn_gate.weightQ3_K[4096 11008]
-
blk.3.ffn_up.weightQ3_K[4096 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weightQ3_K[4096 4096]
-
blk.3.attn_output.weightQ5_K[4096 4096]
-
blk.3.attn_q.weightQ3_K[4096 4096]
-
blk.3.attn_v.weightQ5_K[4096 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ5_K[11008 4096]
-
blk.4.ffn_gate.weightQ3_K[4096 11008]
-
blk.4.ffn_up.weightQ3_K[4096 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weightQ3_K[4096 4096]
-
blk.4.attn_output.weightQ5_K[4096 4096]
-
blk.4.attn_q.weightQ3_K[4096 4096]
-
blk.4.attn_v.weightQ5_K[4096 4096]
-
blk.5.attn_k.weightQ3_K[4096 4096]
-
blk.5.attn_q.weightQ3_K[4096 4096]
-
blk.5.attn_v.weightQ5_K[4096 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ5_K[11008 4096]
-
blk.5.ffn_gate.weightQ3_K[4096 11008]
-
blk.5.ffn_up.weightQ3_K[4096 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_output.weightQ5_K[4096 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ5_K[11008 4096]
-
blk.6.ffn_gate.weightQ3_K[4096 11008]
-
blk.6.ffn_up.weightQ3_K[4096 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weightQ3_K[4096 4096]
-
blk.6.attn_output.weightQ5_K[4096 4096]
-
blk.6.attn_q.weightQ3_K[4096 4096]
-
blk.6.attn_v.weightQ5_K[4096 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ5_K[11008 4096]
-
blk.7.ffn_gate.weightQ3_K[4096 11008]
-
blk.7.ffn_up.weightQ3_K[4096 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weightQ3_K[4096 4096]
-
blk.7.attn_output.weightQ5_K[4096 4096]
-
blk.7.attn_q.weightQ3_K[4096 4096]
-
blk.7.attn_v.weightQ5_K[4096 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ5_K[11008 4096]
-
blk.8.ffn_gate.weightQ3_K[4096 11008]
-
blk.8.ffn_up.weightQ3_K[4096 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weightQ3_K[4096 4096]
-
blk.8.attn_output.weightQ5_K[4096 4096]
-
blk.8.attn_q.weightQ3_K[4096 4096]
-
blk.8.attn_v.weightQ5_K[4096 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ5_K[11008 4096]
-
blk.9.ffn_gate.weightQ3_K[4096 11008]
-
blk.9.ffn_up.weightQ3_K[4096 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weightQ3_K[4096 4096]
-
blk.9.attn_output.weightQ5_K[4096 4096]
-
blk.9.attn_q.weightQ3_K[4096 4096]
-
blk.9.attn_v.weightQ5_K[4096 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ5_K[11008 4096]
-
blk.10.ffn_gate.weightQ3_K[4096 11008]
-
blk.10.ffn_up.weightQ3_K[4096 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weightQ3_K[4096 4096]
-
blk.10.attn_output.weightQ5_K[4096 4096]
-
blk.10.attn_q.weightQ3_K[4096 4096]
-
blk.10.attn_v.weightQ5_K[4096 4096]
-
blk.11.attn_k.weightQ3_K[4096 4096]
-
blk.11.attn_output.weightQ5_K[4096 4096]
-
blk.11.attn_q.weightQ3_K[4096 4096]
-
blk.11.attn_v.weightQ5_K[4096 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ5_K[11008 4096]
-
blk.11.ffn_gate.weightQ3_K[4096 11008]
-
blk.11.ffn_up.weightQ3_K[4096 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ5_K[11008 4096]
-
blk.12.ffn_gate.weightQ3_K[4096 11008]
-
blk.12.ffn_up.weightQ3_K[4096 11008]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.attn_k.weightQ3_K[4096 4096]
-
blk.12.attn_output.weightQ5_K[4096 4096]
-
blk.12.attn_q.weightQ3_K[4096 4096]
-
blk.12.attn_v.weightQ5_K[4096 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ5_K[11008 4096]
-
blk.13.ffn_gate.weightQ3_K[4096 11008]
-
blk.13.ffn_up.weightQ3_K[4096 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weightQ3_K[4096 4096]
-
blk.13.attn_output.weightQ5_K[4096 4096]
-
blk.13.attn_q.weightQ3_K[4096 4096]
-
blk.13.attn_v.weightQ5_K[4096 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ5_K[11008 4096]
-
blk.14.ffn_gate.weightQ3_K[4096 11008]
-
blk.14.ffn_up.weightQ3_K[4096 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weightQ3_K[4096 4096]
-
blk.14.attn_output.weightQ5_K[4096 4096]
-
blk.14.attn_q.weightQ3_K[4096 4096]
-
blk.14.attn_v.weightQ5_K[4096 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ5_K[11008 4096]
-
blk.15.ffn_gate.weightQ3_K[4096 11008]
-
blk.15.ffn_up.weightQ3_K[4096 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weightQ3_K[4096 4096]
-
blk.15.attn_output.weightQ5_K[4096 4096]
-
blk.15.attn_q.weightQ3_K[4096 4096]
-
blk.15.attn_v.weightQ5_K[4096 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ5_K[11008 4096]
-
blk.16.ffn_gate.weightQ3_K[4096 11008]
-
blk.16.ffn_up.weightQ3_K[4096 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weightQ3_K[4096 4096]
-
blk.16.attn_output.weightQ5_K[4096 4096]
-
blk.16.attn_q.weightQ3_K[4096 4096]
-
blk.16.attn_v.weightQ5_K[4096 4096]
-
blk.17.attn_k.weightQ3_K[4096 4096]
-
blk.17.attn_output.weightQ5_K[4096 4096]
-
blk.17.attn_q.weightQ3_K[4096 4096]
-
blk.17.attn_v.weightQ5_K[4096 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ5_K[11008 4096]
-
blk.17.ffn_gate.weightQ3_K[4096 11008]
-
blk.17.ffn_up.weightQ3_K[4096 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ5_K[11008 4096]
-
blk.18.ffn_gate.weightQ3_K[4096 11008]
-
blk.18.ffn_up.weightQ3_K[4096 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weightQ3_K[4096 4096]
-
blk.18.attn_output.weightQ5_K[4096 4096]
-
blk.18.attn_q.weightQ3_K[4096 4096]
-
blk.18.attn_v.weightQ5_K[4096 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ5_K[11008 4096]
-
blk.19.ffn_gate.weightQ3_K[4096 11008]
-
blk.19.ffn_up.weightQ3_K[4096 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weightQ3_K[4096 4096]
-
blk.19.attn_output.weightQ5_K[4096 4096]
-
blk.19.attn_q.weightQ3_K[4096 4096]
-
blk.19.attn_v.weightQ5_K[4096 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ5_K[11008 4096]
-
blk.20.ffn_gate.weightQ3_K[4096 11008]
-
blk.20.ffn_up.weightQ3_K[4096 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weightQ3_K[4096 4096]
-
blk.20.attn_output.weightQ5_K[4096 4096]
-
blk.20.attn_q.weightQ3_K[4096 4096]
-
blk.20.attn_v.weightQ5_K[4096 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ5_K[11008 4096]
-
blk.21.ffn_gate.weightQ3_K[4096 11008]
-
blk.21.ffn_up.weightQ3_K[4096 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weightQ3_K[4096 4096]
-
blk.21.attn_output.weightQ5_K[4096 4096]
-
blk.21.attn_q.weightQ3_K[4096 4096]
-
blk.21.attn_v.weightQ5_K[4096 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ5_K[11008 4096]
-
blk.22.ffn_gate.weightQ3_K[4096 11008]
-
blk.22.ffn_up.weightQ3_K[4096 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weightQ3_K[4096 4096]
-
blk.22.attn_output.weightQ5_K[4096 4096]
-
blk.22.attn_q.weightQ3_K[4096 4096]
-
blk.22.attn_v.weightQ5_K[4096 4096]
-
blk.23.attn_k.weightQ3_K[4096 4096]
-
blk.23.attn_output.weightQ5_K[4096 4096]
-
blk.23.attn_q.weightQ3_K[4096 4096]
-
blk.23.attn_v.weightQ5_K[4096 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ5_K[11008 4096]
-
blk.23.ffn_gate.weightQ3_K[4096 11008]
-
blk.23.ffn_up.weightQ3_K[4096 11008]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ5_K[11008 4096]
-
blk.24.ffn_gate.weightQ3_K[4096 11008]
-
blk.24.ffn_up.weightQ3_K[4096 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weightQ3_K[4096 4096]
-
blk.24.attn_output.weightQ5_K[4096 4096]
-
blk.24.attn_q.weightQ3_K[4096 4096]
-
blk.24.attn_v.weightQ5_K[4096 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ5_K[11008 4096]
-
blk.25.ffn_gate.weightQ3_K[4096 11008]
-
blk.25.ffn_up.weightQ3_K[4096 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weightQ3_K[4096 4096]
-
blk.25.attn_output.weightQ5_K[4096 4096]
-
blk.25.attn_q.weightQ3_K[4096 4096]
-
blk.25.attn_v.weightQ5_K[4096 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ5_K[11008 4096]
-
blk.26.ffn_gate.weightQ3_K[4096 11008]
-
blk.26.ffn_up.weightQ3_K[4096 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weightQ3_K[4096 4096]
-
blk.26.attn_output.weightQ5_K[4096 4096]
-
blk.26.attn_q.weightQ3_K[4096 4096]
-
blk.26.attn_v.weightQ5_K[4096 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ5_K[11008 4096]
-
blk.27.ffn_gate.weightQ3_K[4096 11008]
-
blk.27.ffn_up.weightQ3_K[4096 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_k.weightQ3_K[4096 4096]
-
blk.27.attn_output.weightQ5_K[4096 4096]
-
blk.27.attn_q.weightQ3_K[4096 4096]
-
blk.27.attn_v.weightQ5_K[4096 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ5_K[11008 4096]
-
blk.28.ffn_gate.weightQ3_K[4096 11008]
-
blk.28.ffn_up.weightQ3_K[4096 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weightQ3_K[4096 4096]
-
blk.28.attn_output.weightQ5_K[4096 4096]
-
blk.28.attn_q.weightQ3_K[4096 4096]
-
blk.28.attn_v.weightQ5_K[4096 4096]
-
blk.29.attn_k.weightQ3_K[4096 4096]
-
blk.29.attn_output.weightQ5_K[4096 4096]
-
blk.29.attn_q.weightQ3_K[4096 4096]
-
blk.29.attn_v.weightQ5_K[4096 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ5_K[11008 4096]
-
blk.29.ffn_gate.weightQ3_K[4096 11008]
-
blk.29.ffn_up.weightQ3_K[4096 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ5_K[11008 4096]
-
blk.30.ffn_gate.weightQ3_K[4096 11008]
-
blk.30.ffn_up.weightQ3_K[4096 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weightQ3_K[4096 4096]
-
blk.30.attn_output.weightQ5_K[4096 4096]
-
blk.30.attn_q.weightQ3_K[4096 4096]
-
blk.30.attn_v.weightQ5_K[4096 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ5_K[11008 4096]
-
blk.31.ffn_gate.weightQ3_K[4096 11008]
-
blk.31.ffn_up.weightQ3_K[4096 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weightQ3_K[4096 4096]
-
blk.31.attn_output.weightQ5_K[4096 4096]
-
blk.31.attn_q.weightQ3_K[4096 4096]
-
blk.31.attn_v.weightQ5_K[4096 4096]
-
output.weightQ6_K[4096 44222]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31