3b
1.7GB
39 Pulls Updated 6 months ago
31b41fd17357 · 1.7GB
-
general.architecturestablelm
-
general.file_typeQ4_K_M
-
stablelm.attention.head_count32
-
stablelm.attention.layer_norm_epsilon1e-05
-
stablelm.block_count32
-
stablelm.context_length16384
-
stablelm.embedding_length2560
-
stablelm.feed_forward_length6912
-
stablelm.rope.dimension_count20
-
stablelm.use_parallel_residualtrue
-
tokenizer.ggml.bos_token_id0
-
tokenizer.ggml.eos_token_id0
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a h e i n ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.token_type[3 3 1 1 1 ...]
-
tokenizer.ggml.tokens[<|endoftext|> <|padding|> ! " # ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[2560 50304]
-
blk.0.attn_norm.biasF32[2560]
-
blk.0.attn_norm.weightF32[2560]
-
blk.0.ffn_down.weightQ6_K[6912 2560]
-
blk.0.ffn_gate.weightQ4_K[2560 6912]
-
blk.0.ffn_up.weightQ4_K[2560 6912]
-
blk.0.ffn_norm.biasF32[2560]
-
blk.0.ffn_norm.weightF32[2560]
-
blk.0.attn_k.weightQ4_K[2560 2560]
-
blk.0.attn_output.weightQ4_K[2560 2560]
-
blk.0.attn_q.weightQ4_K[2560 2560]
-
blk.0.attn_v.weightQ6_K[2560 2560]
-
blk.1.attn_norm.biasF32[2560]
-
blk.1.attn_norm.weightF32[2560]
-
blk.1.ffn_down.weightQ6_K[6912 2560]
-
blk.1.ffn_gate.weightQ4_K[2560 6912]
-
blk.1.ffn_up.weightQ4_K[2560 6912]
-
blk.1.ffn_norm.biasF32[2560]
-
blk.1.ffn_norm.weightF32[2560]
-
blk.1.attn_k.weightQ4_K[2560 2560]
-
blk.1.attn_output.weightQ4_K[2560 2560]
-
blk.1.attn_q.weightQ4_K[2560 2560]
-
blk.1.attn_v.weightQ6_K[2560 2560]
-
blk.2.attn_norm.biasF32[2560]
-
blk.2.attn_norm.weightF32[2560]
-
blk.2.ffn_down.weightQ6_K[6912 2560]
-
blk.2.ffn_gate.weightQ4_K[2560 6912]
-
blk.2.ffn_up.weightQ4_K[2560 6912]
-
blk.2.ffn_norm.biasF32[2560]
-
blk.2.ffn_norm.weightF32[2560]
-
blk.2.attn_k.weightQ4_K[2560 2560]
-
blk.2.attn_output.weightQ4_K[2560 2560]
-
blk.2.attn_q.weightQ4_K[2560 2560]
-
blk.2.attn_v.weightQ6_K[2560 2560]
-
blk.3.attn_norm.biasF32[2560]
-
blk.3.attn_norm.weightF32[2560]
-
blk.3.ffn_down.weightQ4_K[6912 2560]
-
blk.3.ffn_gate.weightQ4_K[2560 6912]
-
blk.3.ffn_up.weightQ4_K[2560 6912]
-
blk.3.ffn_norm.biasF32[2560]
-
blk.3.ffn_norm.weightF32[2560]
-
blk.3.attn_k.weightQ4_K[2560 2560]
-
blk.3.attn_output.weightQ4_K[2560 2560]
-
blk.3.attn_q.weightQ4_K[2560 2560]
-
blk.3.attn_v.weightQ4_K[2560 2560]
-
blk.4.attn_norm.biasF32[2560]
-
blk.4.attn_norm.weightF32[2560]
-
blk.4.ffn_down.weightQ4_K[6912 2560]
-
blk.4.ffn_gate.weightQ4_K[2560 6912]
-
blk.4.ffn_up.weightQ4_K[2560 6912]
-
blk.4.ffn_norm.biasF32[2560]
-
blk.4.ffn_norm.weightF32[2560]
-
blk.4.attn_k.weightQ4_K[2560 2560]
-
blk.4.attn_output.weightQ4_K[2560 2560]
-
blk.4.attn_q.weightQ4_K[2560 2560]
-
blk.4.attn_v.weightQ6_K[2560 2560]
-
blk.5.attn_norm.biasF32[2560]
-
blk.5.attn_norm.weightF32[2560]
-
blk.5.ffn_down.weightQ6_K[6912 2560]
-
blk.5.ffn_gate.weightQ4_K[2560 6912]
-
blk.5.ffn_up.weightQ4_K[2560 6912]
-
blk.5.ffn_norm.biasF32[2560]
-
blk.5.ffn_norm.weightF32[2560]
-
blk.5.attn_k.weightQ4_K[2560 2560]
-
blk.5.attn_output.weightQ4_K[2560 2560]
-
blk.5.attn_q.weightQ4_K[2560 2560]
-
blk.5.attn_v.weightQ4_K[2560 2560]
-
blk.6.attn_norm.biasF32[2560]
-
blk.6.attn_norm.weightF32[2560]
-
blk.6.ffn_down.weightQ4_K[6912 2560]
-
blk.6.ffn_gate.weightQ4_K[2560 6912]
-
blk.6.ffn_up.weightQ4_K[2560 6912]
-
blk.6.ffn_norm.biasF32[2560]
-
blk.6.ffn_norm.weightF32[2560]
-
blk.6.attn_k.weightQ4_K[2560 2560]
-
blk.6.attn_output.weightQ4_K[2560 2560]
-
blk.6.attn_q.weightQ4_K[2560 2560]
-
blk.6.attn_v.weightQ4_K[2560 2560]
-
blk.7.attn_norm.biasF32[2560]
-
blk.7.attn_norm.weightF32[2560]
-
blk.7.ffn_down.weightQ4_K[6912 2560]
-
blk.7.ffn_gate.weightQ4_K[2560 6912]
-
blk.7.ffn_up.weightQ4_K[2560 6912]
-
blk.7.ffn_norm.biasF32[2560]
-
blk.7.ffn_norm.weightF32[2560]
-
blk.7.attn_k.weightQ4_K[2560 2560]
-
blk.7.attn_output.weightQ4_K[2560 2560]
-
blk.7.attn_q.weightQ4_K[2560 2560]
-
blk.7.attn_v.weightQ6_K[2560 2560]
-
blk.8.attn_norm.biasF32[2560]
-
blk.8.attn_norm.weightF32[2560]
-
blk.8.ffn_down.weightQ6_K[6912 2560]
-
blk.8.ffn_gate.weightQ4_K[2560 6912]
-
blk.8.ffn_up.weightQ4_K[2560 6912]
-
blk.8.ffn_norm.biasF32[2560]
-
blk.8.ffn_norm.weightF32[2560]
-
blk.8.attn_k.weightQ4_K[2560 2560]
-
blk.8.attn_output.weightQ4_K[2560 2560]
-
blk.8.attn_q.weightQ4_K[2560 2560]
-
blk.8.attn_v.weightQ6_K[2560 2560]
-
blk.9.attn_norm.biasF32[2560]
-
blk.9.attn_norm.weightF32[2560]
-
blk.9.ffn_down.weightQ6_K[6912 2560]
-
blk.9.ffn_gate.weightQ4_K[2560 6912]
-
blk.9.ffn_up.weightQ4_K[2560 6912]
-
blk.9.ffn_norm.biasF32[2560]
-
blk.9.ffn_norm.weightF32[2560]
-
blk.9.attn_k.weightQ4_K[2560 2560]
-
blk.9.attn_output.weightQ4_K[2560 2560]
-
blk.9.attn_q.weightQ4_K[2560 2560]
-
blk.9.attn_v.weightQ6_K[2560 2560]
-
blk.10.attn_norm.biasF32[2560]
-
blk.10.attn_norm.weightF32[2560]
-
blk.10.ffn_down.weightQ6_K[6912 2560]
-
blk.10.ffn_gate.weightQ4_K[2560 6912]
-
blk.10.ffn_up.weightQ4_K[2560 6912]
-
blk.10.ffn_norm.biasF32[2560]
-
blk.10.ffn_norm.weightF32[2560]
-
blk.10.attn_k.weightQ4_K[2560 2560]
-
blk.10.attn_output.weightQ4_K[2560 2560]
-
blk.10.attn_q.weightQ4_K[2560 2560]
-
blk.10.attn_v.weightQ6_K[2560 2560]
-
blk.11.attn_norm.biasF32[2560]
-
blk.11.attn_norm.weightF32[2560]
-
blk.11.ffn_down.weightQ6_K[6912 2560]
-
blk.11.ffn_gate.weightQ4_K[2560 6912]
-
blk.11.ffn_up.weightQ4_K[2560 6912]
-
blk.11.ffn_norm.biasF32[2560]
-
blk.11.ffn_norm.weightF32[2560]
-
blk.11.attn_k.weightQ4_K[2560 2560]
-
blk.11.attn_output.weightQ4_K[2560 2560]
-
blk.11.attn_q.weightQ4_K[2560 2560]
-
blk.11.attn_v.weightQ6_K[2560 2560]
-
blk.12.attn_norm.biasF32[2560]
-
blk.12.attn_norm.weightF32[2560]
-
blk.12.ffn_down.weightQ4_K[6912 2560]
-
blk.12.ffn_gate.weightQ4_K[2560 6912]
-
blk.12.ffn_up.weightQ4_K[2560 6912]
-
blk.12.ffn_norm.biasF32[2560]
-
blk.12.ffn_norm.weightF32[2560]
-
blk.12.attn_k.weightQ4_K[2560 2560]
-
blk.12.attn_output.weightQ4_K[2560 2560]
-
blk.12.attn_q.weightQ4_K[2560 2560]
-
blk.12.attn_v.weightQ4_K[2560 2560]
-
blk.13.attn_norm.biasF32[2560]
-
blk.13.attn_norm.weightF32[2560]
-
blk.13.ffn_down.weightQ4_K[6912 2560]
-
blk.13.ffn_gate.weightQ4_K[2560 6912]
-
blk.13.ffn_up.weightQ4_K[2560 6912]
-
blk.13.ffn_norm.biasF32[2560]
-
blk.13.ffn_norm.weightF32[2560]
-
blk.13.attn_k.weightQ4_K[2560 2560]
-
blk.13.attn_output.weightQ4_K[2560 2560]
-
blk.13.attn_q.weightQ4_K[2560 2560]
-
blk.13.attn_v.weightQ4_K[2560 2560]
-
blk.14.attn_norm.biasF32[2560]
-
blk.14.attn_norm.weightF32[2560]
-
blk.14.ffn_down.weightQ6_K[6912 2560]
-
blk.14.ffn_gate.weightQ4_K[2560 6912]
-
blk.14.ffn_up.weightQ4_K[2560 6912]
-
blk.14.ffn_norm.biasF32[2560]
-
blk.14.ffn_norm.weightF32[2560]
-
blk.14.attn_k.weightQ4_K[2560 2560]
-
blk.14.attn_output.weightQ4_K[2560 2560]
-
blk.14.attn_q.weightQ4_K[2560 2560]
-
blk.14.attn_v.weightQ6_K[2560 2560]
-
blk.15.attn_norm.biasF32[2560]
-
blk.15.attn_norm.weightF32[2560]
-
blk.15.ffn_down.weightQ4_K[6912 2560]
-
blk.15.ffn_gate.weightQ4_K[2560 6912]
-
blk.15.ffn_up.weightQ4_K[2560 6912]
-
blk.15.ffn_norm.biasF32[2560]
-
blk.15.ffn_norm.weightF32[2560]
-
blk.15.attn_k.weightQ4_K[2560 2560]
-
blk.15.attn_output.weightQ4_K[2560 2560]
-
blk.15.attn_q.weightQ4_K[2560 2560]
-
blk.15.attn_v.weightQ4_K[2560 2560]
-
blk.16.attn_norm.biasF32[2560]
-
blk.16.attn_norm.weightF32[2560]
-
blk.16.ffn_down.weightQ4_K[6912 2560]
-
blk.16.ffn_gate.weightQ4_K[2560 6912]
-
blk.16.ffn_up.weightQ4_K[2560 6912]
-
blk.16.ffn_norm.biasF32[2560]
-
blk.16.ffn_norm.weightF32[2560]
-
blk.16.attn_k.weightQ4_K[2560 2560]
-
blk.16.attn_output.weightQ4_K[2560 2560]
-
blk.16.attn_q.weightQ4_K[2560 2560]
-
blk.16.attn_v.weightQ4_K[2560 2560]
-
blk.17.attn_norm.biasF32[2560]
-
blk.17.attn_norm.weightF32[2560]
-
blk.17.ffn_down.weightQ6_K[6912 2560]
-
blk.17.ffn_gate.weightQ4_K[2560 6912]
-
blk.17.ffn_up.weightQ4_K[2560 6912]
-
blk.17.ffn_norm.biasF32[2560]
-
blk.17.ffn_norm.weightF32[2560]
-
blk.17.attn_k.weightQ4_K[2560 2560]
-
blk.17.attn_output.weightQ4_K[2560 2560]
-
blk.17.attn_q.weightQ4_K[2560 2560]
-
blk.17.attn_v.weightQ6_K[2560 2560]
-
blk.18.attn_norm.biasF32[2560]
-
blk.18.attn_norm.weightF32[2560]
-
blk.18.ffn_down.weightQ4_K[6912 2560]
-
blk.18.ffn_gate.weightQ4_K[2560 6912]
-
blk.18.ffn_up.weightQ4_K[2560 6912]
-
blk.18.ffn_norm.biasF32[2560]
-
blk.18.ffn_norm.weightF32[2560]
-
blk.18.attn_k.weightQ4_K[2560 2560]
-
blk.18.attn_output.weightQ4_K[2560 2560]
-
blk.18.attn_q.weightQ4_K[2560 2560]
-
blk.18.attn_v.weightQ4_K[2560 2560]
-
blk.19.attn_norm.biasF32[2560]
-
blk.19.attn_norm.weightF32[2560]
-
blk.19.ffn_down.weightQ4_K[6912 2560]
-
blk.19.ffn_gate.weightQ4_K[2560 6912]
-
blk.19.ffn_up.weightQ4_K[2560 6912]
-
blk.19.ffn_norm.biasF32[2560]
-
blk.19.ffn_norm.weightF32[2560]
-
blk.19.attn_k.weightQ4_K[2560 2560]
-
blk.19.attn_output.weightQ4_K[2560 2560]
-
blk.19.attn_q.weightQ4_K[2560 2560]
-
blk.19.attn_v.weightQ4_K[2560 2560]
-
blk.20.attn_norm.biasF32[2560]
-
blk.20.attn_norm.weightF32[2560]
-
blk.20.ffn_down.weightQ4_K[6912 2560]
-
blk.20.ffn_gate.weightQ4_K[2560 6912]
-
blk.20.ffn_up.weightQ4_K[2560 6912]
-
blk.20.ffn_norm.biasF32[2560]
-
blk.20.ffn_norm.weightF32[2560]
-
blk.20.attn_k.weightQ4_K[2560 2560]
-
blk.20.attn_output.weightQ4_K[2560 2560]
-
blk.20.attn_q.weightQ4_K[2560 2560]
-
blk.20.attn_v.weightQ4_K[2560 2560]
-
blk.21.attn_norm.biasF32[2560]
-
blk.21.attn_norm.weightF32[2560]
-
blk.21.ffn_down.weightQ4_K[6912 2560]
-
blk.21.ffn_gate.weightQ4_K[2560 6912]
-
blk.21.ffn_up.weightQ4_K[2560 6912]
-
blk.21.ffn_norm.biasF32[2560]
-
blk.21.ffn_norm.weightF32[2560]
-
blk.21.attn_k.weightQ4_K[2560 2560]
-
blk.21.attn_output.weightQ4_K[2560 2560]
-
blk.21.attn_q.weightQ4_K[2560 2560]
-
blk.21.attn_v.weightQ4_K[2560 2560]
-
blk.22.attn_norm.biasF32[2560]
-
blk.22.attn_norm.weightF32[2560]
-
blk.22.ffn_down.weightQ6_K[6912 2560]
-
blk.22.ffn_gate.weightQ4_K[2560 6912]
-
blk.22.ffn_up.weightQ4_K[2560 6912]
-
blk.22.ffn_norm.biasF32[2560]
-
blk.22.ffn_norm.weightF32[2560]
-
blk.22.attn_k.weightQ4_K[2560 2560]
-
blk.22.attn_output.weightQ4_K[2560 2560]
-
blk.22.attn_q.weightQ4_K[2560 2560]
-
blk.22.attn_v.weightQ6_K[2560 2560]
-
blk.23.attn_norm.biasF32[2560]
-
blk.23.attn_norm.weightF32[2560]
-
blk.23.ffn_down.weightQ4_K[6912 2560]
-
blk.23.ffn_gate.weightQ4_K[2560 6912]
-
blk.23.ffn_up.weightQ4_K[2560 6912]
-
blk.23.ffn_norm.biasF32[2560]
-
blk.23.ffn_norm.weightF32[2560]
-
blk.23.attn_k.weightQ4_K[2560 2560]
-
blk.23.attn_output.weightQ4_K[2560 2560]
-
blk.23.attn_q.weightQ4_K[2560 2560]
-
blk.23.attn_v.weightQ4_K[2560 2560]
-
blk.24.attn_norm.biasF32[2560]
-
blk.24.attn_norm.weightF32[2560]
-
blk.24.ffn_down.weightQ4_K[6912 2560]
-
blk.24.ffn_gate.weightQ4_K[2560 6912]
-
blk.24.ffn_up.weightQ4_K[2560 6912]
-
blk.24.ffn_norm.biasF32[2560]
-
blk.24.ffn_norm.weightF32[2560]
-
blk.24.attn_k.weightQ4_K[2560 2560]
-
blk.24.attn_output.weightQ4_K[2560 2560]
-
blk.24.attn_q.weightQ4_K[2560 2560]
-
blk.24.attn_v.weightQ4_K[2560 2560]
-
blk.25.attn_norm.biasF32[2560]
-
blk.25.attn_norm.weightF32[2560]
-
blk.25.ffn_down.weightQ6_K[6912 2560]
-
blk.25.ffn_gate.weightQ4_K[2560 6912]
-
blk.25.ffn_up.weightQ4_K[2560 6912]
-
blk.25.ffn_norm.biasF32[2560]
-
blk.25.ffn_norm.weightF32[2560]
-
blk.25.attn_k.weightQ4_K[2560 2560]
-
blk.25.attn_output.weightQ4_K[2560 2560]
-
blk.25.attn_q.weightQ4_K[2560 2560]
-
blk.25.attn_v.weightQ6_K[2560 2560]
-
blk.26.attn_norm.biasF32[2560]
-
blk.26.attn_norm.weightF32[2560]
-
blk.26.ffn_down.weightQ4_K[6912 2560]
-
blk.26.ffn_gate.weightQ4_K[2560 6912]
-
blk.26.ffn_up.weightQ4_K[2560 6912]
-
blk.26.ffn_norm.biasF32[2560]
-
blk.26.ffn_norm.weightF32[2560]
-
blk.26.attn_k.weightQ4_K[2560 2560]
-
blk.26.attn_output.weightQ4_K[2560 2560]
-
blk.26.attn_q.weightQ4_K[2560 2560]
-
blk.26.attn_v.weightQ4_K[2560 2560]
-
blk.27.attn_norm.biasF32[2560]
-
blk.27.attn_norm.weightF32[2560]
-
blk.27.ffn_down.weightQ4_K[6912 2560]
-
blk.27.ffn_gate.weightQ4_K[2560 6912]
-
blk.27.ffn_up.weightQ4_K[2560 6912]
-
blk.27.ffn_norm.biasF32[2560]
-
blk.27.ffn_norm.weightF32[2560]
-
blk.27.attn_k.weightQ4_K[2560 2560]
-
blk.27.attn_output.weightQ4_K[2560 2560]
-
blk.27.attn_q.weightQ4_K[2560 2560]
-
blk.27.attn_v.weightQ4_K[2560 2560]
-
blk.28.attn_norm.biasF32[2560]
-
blk.28.attn_norm.weightF32[2560]
-
blk.28.ffn_down.weightQ6_K[6912 2560]
-
blk.28.ffn_gate.weightQ4_K[2560 6912]
-
blk.28.ffn_up.weightQ4_K[2560 6912]
-
blk.28.ffn_norm.biasF32[2560]
-
blk.28.ffn_norm.weightF32[2560]
-
blk.28.attn_k.weightQ4_K[2560 2560]
-
blk.28.attn_output.weightQ4_K[2560 2560]
-
blk.28.attn_q.weightQ4_K[2560 2560]
-
blk.28.attn_v.weightQ6_K[2560 2560]
-
blk.29.ffn_gate.weightQ4_K[2560 6912]
-
blk.29.ffn_up.weightQ4_K[2560 6912]
-
blk.29.attn_k.weightQ4_K[2560 2560]
-
blk.29.attn_output.weightQ4_K[2560 2560]
-
blk.29.attn_q.weightQ4_K[2560 2560]
-
blk.29.attn_v.weightQ4_K[2560 2560]
-
blk.29.attn_norm.biasF32[2560]
-
blk.29.attn_norm.weightF32[2560]
-
blk.29.ffn_down.weightQ6_K[6912 2560]
-
blk.29.ffn_norm.biasF32[2560]
-
blk.29.ffn_norm.weightF32[2560]
-
blk.30.attn_norm.biasF32[2560]
-
blk.30.attn_norm.weightF32[2560]
-
blk.30.ffn_down.weightQ6_K[6912 2560]
-
blk.30.ffn_gate.weightQ4_K[2560 6912]
-
blk.30.ffn_up.weightQ4_K[2560 6912]
-
blk.30.ffn_norm.biasF32[2560]
-
blk.30.ffn_norm.weightF32[2560]
-
blk.30.attn_k.weightQ4_K[2560 2560]
-
blk.30.attn_output.weightQ4_K[2560 2560]
-
blk.30.attn_q.weightQ4_K[2560 2560]
-
blk.30.attn_v.weightQ6_K[2560 2560]
-
blk.31.attn_norm.biasF32[2560]
-
blk.31.attn_norm.weightF32[2560]
-
blk.31.ffn_down.weightQ6_K[6912 2560]
-
blk.31.ffn_gate.weightQ4_K[2560 6912]
-
blk.31.ffn_up.weightQ4_K[2560 6912]
-
blk.31.ffn_norm.biasF32[2560]
-
blk.31.ffn_norm.weightF32[2560]
-
blk.31.attn_k.weightQ4_K[2560 2560]
-
blk.31.attn_output.weightQ4_K[2560 2560]
-
blk.31.attn_q.weightQ4_K[2560 2560]
-
blk.31.attn_v.weightQ6_K[2560 2560]
-
output.weightQ6_K[2560 50304]
-
output_norm.biasF32[2560]
-
output_norm.weightF32[2560]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31