Quantized version of ise-uiuc/Magicoder-S-DS-6.7B
7B
211 Pulls Updated 6 months ago
beaf8675e2e3 · 4.8GB
-
general.architecturellama
-
general.file_typeQ5_K_M
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count32
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
llama.use_parallel_residualtrue
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32014
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modeldeepseek_coder
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ5_K[4096 32256]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ6_K[11008 4096]
-
blk.0.ffn_gate.weightQ5_K[4096 11008]
-
blk.0.ffn_up.weightQ5_K[4096 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weightQ5_K[4096 4096]
-
blk.0.attn_output.weightQ5_K[4096 4096]
-
blk.0.attn_q.weightQ5_K[4096 4096]
-
blk.0.attn_v.weightQ6_K[4096 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ6_K[11008 4096]
-
blk.1.ffn_gate.weightQ5_K[4096 11008]
-
blk.1.ffn_up.weightQ5_K[4096 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weightQ5_K[4096 4096]
-
blk.1.attn_output.weightQ5_K[4096 4096]
-
blk.1.attn_q.weightQ5_K[4096 4096]
-
blk.1.attn_v.weightQ6_K[4096 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ6_K[11008 4096]
-
blk.2.ffn_gate.weightQ5_K[4096 11008]
-
blk.2.ffn_up.weightQ5_K[4096 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weightQ5_K[4096 4096]
-
blk.2.attn_output.weightQ5_K[4096 4096]
-
blk.2.attn_q.weightQ5_K[4096 4096]
-
blk.2.attn_v.weightQ6_K[4096 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ6_K[11008 4096]
-
blk.3.ffn_gate.weightQ5_K[4096 11008]
-
blk.3.ffn_up.weightQ5_K[4096 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weightQ5_K[4096 4096]
-
blk.3.attn_output.weightQ5_K[4096 4096]
-
blk.3.attn_q.weightQ5_K[4096 4096]
-
blk.3.attn_v.weightQ6_K[4096 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ5_K[11008 4096]
-
blk.4.ffn_gate.weightQ5_K[4096 11008]
-
blk.4.ffn_up.weightQ5_K[4096 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weightQ5_K[4096 4096]
-
blk.4.attn_output.weightQ5_K[4096 4096]
-
blk.4.attn_q.weightQ5_K[4096 4096]
-
blk.4.attn_v.weightQ5_K[4096 4096]
-
blk.5.attn_k.weightQ5_K[4096 4096]
-
blk.5.attn_output.weightQ5_K[4096 4096]
-
blk.5.attn_q.weightQ5_K[4096 4096]
-
blk.5.attn_v.weightQ5_K[4096 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ6_K[11008 4096]
-
blk.5.ffn_gate.weightQ5_K[4096 11008]
-
blk.5.ffn_up.weightQ5_K[4096 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ5_K[11008 4096]
-
blk.6.ffn_gate.weightQ5_K[4096 11008]
-
blk.6.ffn_up.weightQ5_K[4096 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weightQ5_K[4096 4096]
-
blk.6.attn_output.weightQ5_K[4096 4096]
-
blk.6.attn_q.weightQ5_K[4096 4096]
-
blk.6.attn_v.weightQ5_K[4096 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ5_K[11008 4096]
-
blk.7.ffn_gate.weightQ5_K[4096 11008]
-
blk.7.ffn_up.weightQ5_K[4096 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weightQ5_K[4096 4096]
-
blk.7.attn_output.weightQ5_K[4096 4096]
-
blk.7.attn_q.weightQ5_K[4096 4096]
-
blk.7.attn_v.weightQ6_K[4096 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ6_K[11008 4096]
-
blk.8.ffn_gate.weightQ5_K[4096 11008]
-
blk.8.ffn_up.weightQ5_K[4096 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weightQ5_K[4096 4096]
-
blk.8.attn_output.weightQ5_K[4096 4096]
-
blk.8.attn_q.weightQ5_K[4096 4096]
-
blk.8.attn_v.weightQ5_K[4096 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ5_K[11008 4096]
-
blk.9.ffn_gate.weightQ5_K[4096 11008]
-
blk.9.ffn_up.weightQ5_K[4096 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weightQ5_K[4096 4096]
-
blk.9.attn_output.weightQ5_K[4096 4096]
-
blk.9.attn_q.weightQ5_K[4096 4096]
-
blk.9.attn_v.weightQ5_K[4096 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ5_K[11008 4096]
-
blk.10.ffn_gate.weightQ5_K[4096 11008]
-
blk.10.ffn_up.weightQ5_K[4096 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weightQ5_K[4096 4096]
-
blk.10.attn_output.weightQ5_K[4096 4096]
-
blk.10.attn_q.weightQ5_K[4096 4096]
-
blk.10.attn_v.weightQ6_K[4096 4096]
-
blk.11.attn_k.weightQ5_K[4096 4096]
-
blk.11.attn_output.weightQ5_K[4096 4096]
-
blk.11.attn_q.weightQ5_K[4096 4096]
-
blk.11.attn_v.weightQ5_K[4096 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ5_K[11008 4096]
-
blk.11.ffn_gate.weightQ5_K[4096 11008]
-
blk.11.ffn_up.weightQ5_K[4096 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ6_K[11008 4096]
-
blk.12.ffn_gate.weightQ5_K[4096 11008]
-
blk.12.ffn_up.weightQ5_K[4096 11008]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.attn_k.weightQ5_K[4096 4096]
-
blk.12.attn_output.weightQ5_K[4096 4096]
-
blk.12.attn_q.weightQ5_K[4096 4096]
-
blk.12.attn_v.weightQ6_K[4096 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ5_K[11008 4096]
-
blk.13.ffn_gate.weightQ5_K[4096 11008]
-
blk.13.ffn_up.weightQ5_K[4096 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weightQ5_K[4096 4096]
-
blk.13.attn_output.weightQ5_K[4096 4096]
-
blk.13.attn_q.weightQ5_K[4096 4096]
-
blk.13.attn_v.weightQ5_K[4096 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ5_K[11008 4096]
-
blk.14.ffn_gate.weightQ5_K[4096 11008]
-
blk.14.ffn_up.weightQ5_K[4096 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weightQ5_K[4096 4096]
-
blk.14.attn_output.weightQ5_K[4096 4096]
-
blk.14.attn_q.weightQ5_K[4096 4096]
-
blk.14.attn_v.weightQ5_K[4096 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ6_K[11008 4096]
-
blk.15.ffn_gate.weightQ5_K[4096 11008]
-
blk.15.ffn_up.weightQ5_K[4096 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weightQ5_K[4096 4096]
-
blk.15.attn_output.weightQ5_K[4096 4096]
-
blk.15.attn_q.weightQ5_K[4096 4096]
-
blk.15.attn_v.weightQ6_K[4096 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ5_K[11008 4096]
-
blk.16.ffn_gate.weightQ5_K[4096 11008]
-
blk.16.ffn_up.weightQ5_K[4096 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weightQ5_K[4096 4096]
-
blk.16.attn_output.weightQ5_K[4096 4096]
-
blk.16.attn_q.weightQ5_K[4096 4096]
-
blk.16.attn_v.weightQ5_K[4096 4096]
-
blk.17.attn_k.weightQ5_K[4096 4096]
-
blk.17.attn_output.weightQ5_K[4096 4096]
-
blk.17.attn_q.weightQ5_K[4096 4096]
-
blk.17.attn_v.weightQ5_K[4096 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ5_K[11008 4096]
-
blk.17.ffn_gate.weightQ5_K[4096 11008]
-
blk.17.ffn_up.weightQ5_K[4096 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ6_K[11008 4096]
-
blk.18.ffn_gate.weightQ5_K[4096 11008]
-
blk.18.ffn_up.weightQ5_K[4096 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weightQ5_K[4096 4096]
-
blk.18.attn_output.weightQ5_K[4096 4096]
-
blk.18.attn_q.weightQ5_K[4096 4096]
-
blk.18.attn_v.weightQ6_K[4096 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ5_K[11008 4096]
-
blk.19.ffn_gate.weightQ5_K[4096 11008]
-
blk.19.ffn_up.weightQ5_K[4096 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weightQ5_K[4096 4096]
-
blk.19.attn_output.weightQ5_K[4096 4096]
-
blk.19.attn_q.weightQ5_K[4096 4096]
-
blk.19.attn_v.weightQ5_K[4096 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ5_K[11008 4096]
-
blk.20.ffn_gate.weightQ5_K[4096 11008]
-
blk.20.ffn_up.weightQ5_K[4096 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weightQ5_K[4096 4096]
-
blk.20.attn_output.weightQ5_K[4096 4096]
-
blk.20.attn_q.weightQ5_K[4096 4096]
-
blk.20.attn_v.weightQ5_K[4096 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ6_K[11008 4096]
-
blk.21.ffn_gate.weightQ5_K[4096 11008]
-
blk.21.ffn_up.weightQ5_K[4096 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weightQ5_K[4096 4096]
-
blk.21.attn_output.weightQ5_K[4096 4096]
-
blk.21.attn_q.weightQ5_K[4096 4096]
-
blk.21.attn_v.weightQ6_K[4096 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ5_K[11008 4096]
-
blk.22.ffn_gate.weightQ5_K[4096 11008]
-
blk.22.ffn_up.weightQ5_K[4096 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weightQ5_K[4096 4096]
-
blk.22.attn_output.weightQ5_K[4096 4096]
-
blk.22.attn_q.weightQ5_K[4096 4096]
-
blk.22.attn_v.weightQ5_K[4096 4096]
-
blk.23.attn_k.weightQ5_K[4096 4096]
-
blk.23.attn_output.weightQ5_K[4096 4096]
-
blk.23.attn_q.weightQ5_K[4096 4096]
-
blk.23.attn_v.weightQ5_K[4096 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ5_K[11008 4096]
-
blk.23.ffn_gate.weightQ5_K[4096 11008]
-
blk.23.ffn_up.weightQ5_K[4096 11008]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ6_K[11008 4096]
-
blk.24.ffn_gate.weightQ5_K[4096 11008]
-
blk.24.ffn_up.weightQ5_K[4096 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weightQ5_K[4096 4096]
-
blk.24.attn_output.weightQ5_K[4096 4096]
-
blk.24.attn_q.weightQ5_K[4096 4096]
-
blk.24.attn_v.weightQ6_K[4096 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ5_K[11008 4096]
-
blk.25.ffn_gate.weightQ5_K[4096 11008]
-
blk.25.ffn_up.weightQ5_K[4096 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weightQ5_K[4096 4096]
-
blk.25.attn_output.weightQ5_K[4096 4096]
-
blk.25.attn_q.weightQ5_K[4096 4096]
-
blk.25.attn_v.weightQ5_K[4096 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ5_K[11008 4096]
-
blk.26.ffn_gate.weightQ5_K[4096 11008]
-
blk.26.ffn_up.weightQ5_K[4096 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weightQ5_K[4096 4096]
-
blk.26.attn_output.weightQ5_K[4096 4096]
-
blk.26.attn_q.weightQ5_K[4096 4096]
-
blk.26.attn_v.weightQ5_K[4096 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ6_K[11008 4096]
-
blk.27.ffn_gate.weightQ5_K[4096 11008]
-
blk.27.ffn_up.weightQ5_K[4096 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_k.weightQ5_K[4096 4096]
-
blk.27.attn_output.weightQ5_K[4096 4096]
-
blk.27.attn_q.weightQ5_K[4096 4096]
-
blk.27.attn_v.weightQ6_K[4096 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ6_K[11008 4096]
-
blk.28.ffn_gate.weightQ5_K[4096 11008]
-
blk.28.ffn_up.weightQ5_K[4096 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weightQ5_K[4096 4096]
-
blk.28.attn_output.weightQ5_K[4096 4096]
-
blk.28.attn_q.weightQ5_K[4096 4096]
-
blk.28.attn_v.weightQ6_K[4096 4096]
-
blk.29.attn_k.weightQ5_K[4096 4096]
-
blk.29.attn_output.weightQ5_K[4096 4096]
-
blk.29.attn_q.weightQ5_K[4096 4096]
-
blk.29.attn_v.weightQ6_K[4096 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ6_K[11008 4096]
-
blk.29.ffn_gate.weightQ5_K[4096 11008]
-
blk.29.ffn_up.weightQ5_K[4096 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ6_K[11008 4096]
-
blk.30.ffn_gate.weightQ5_K[4096 11008]
-
blk.30.ffn_up.weightQ5_K[4096 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weightQ5_K[4096 4096]
-
blk.30.attn_output.weightQ5_K[4096 4096]
-
blk.30.attn_q.weightQ5_K[4096 4096]
-
blk.30.attn_v.weightQ6_K[4096 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ6_K[11008 4096]
-
blk.31.ffn_gate.weightQ5_K[4096 11008]
-
blk.31.ffn_up.weightQ5_K[4096 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weightQ5_K[4096 4096]
-
blk.31.attn_output.weightQ5_K[4096 4096]
-
blk.31.attn_q.weightQ5_K[4096 4096]
-
blk.31.attn_v.weightQ6_K[4096 4096]
-
output.weightQ6_K[4096 32256]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31