latest
8.1GB
CodeS is a series of Code LLMs specifically optimized for SQL generation.
3 Pulls Updated 3 weeks ago
1bb751d0b03c · 8.1GB
-
general.architecturestarcoder
-
general.file_typeQ8_0
-
starcoder.attention.head_count32
-
starcoder.attention.head_count_kv1
-
starcoder.attention.layer_norm_epsilon1e-05
-
starcoder.block_count42
-
starcoder.context_length8192
-
starcoder.embedding_length4096
-
starcoder.feed_forward_length16384
-
tokenizer.ggml.bos_token_id0
-
tokenizer.ggml.eos_token_id0
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ ĠĠĠĠ ĠĠĠĠ ĠĠ Ġ e r ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.prerefact
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<|endoftext|> <fim_prefix> <fim_middle> <fim_suffix> <fim_pad> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ8_0[4096 49152]
-
position_embd.weightF32[4096 8192]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_norm.biasF32[4096]
-
blk.0.attn_qkv.weightQ8_0[4096 4352]
-
blk.0.attn_qkv.biasF32[4352]
-
blk.0.attn_output.weightQ8_0[4096 4096]
-
blk.0.attn_output.biasF32[4096]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_norm.biasF32[4096]
-
blk.0.ffn_up.weightQ8_0[4096 16384]
-
blk.0.ffn_up.biasF32[16384]
-
blk.0.ffn_down.weightQ8_0[16384 4096]
-
blk.0.ffn_down.biasF32[4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_norm.biasF32[4096]
-
blk.1.attn_qkv.weightQ8_0[4096 4352]
-
blk.1.attn_qkv.biasF32[4352]
-
blk.1.attn_output.weightQ8_0[4096 4096]
-
blk.1.attn_output.biasF32[4096]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_norm.biasF32[4096]
-
blk.1.ffn_up.weightQ8_0[4096 16384]
-
blk.1.ffn_up.biasF32[16384]
-
blk.1.ffn_down.weightQ8_0[16384 4096]
-
blk.1.ffn_down.biasF32[4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_norm.biasF32[4096]
-
blk.2.attn_qkv.weightQ8_0[4096 4352]
-
blk.2.attn_qkv.biasF32[4352]
-
blk.2.attn_output.weightQ8_0[4096 4096]
-
blk.2.attn_output.biasF32[4096]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_norm.biasF32[4096]
-
blk.2.ffn_up.weightQ8_0[4096 16384]
-
blk.2.ffn_up.biasF32[16384]
-
blk.2.ffn_down.weightQ8_0[16384 4096]
-
blk.2.ffn_down.biasF32[4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_norm.biasF32[4096]
-
blk.3.attn_qkv.weightQ8_0[4096 4352]
-
blk.3.attn_qkv.biasF32[4352]
-
blk.3.attn_output.weightQ8_0[4096 4096]
-
blk.3.attn_output.biasF32[4096]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_norm.biasF32[4096]
-
blk.3.ffn_up.weightQ8_0[4096 16384]
-
blk.3.ffn_up.biasF32[16384]
-
blk.3.ffn_down.weightQ8_0[16384 4096]
-
blk.3.ffn_down.biasF32[4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_norm.biasF32[4096]
-
blk.4.attn_qkv.weightQ8_0[4096 4352]
-
blk.4.attn_qkv.biasF32[4352]
-
blk.4.attn_output.weightQ8_0[4096 4096]
-
blk.4.attn_output.biasF32[4096]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_norm.biasF32[4096]
-
blk.4.ffn_up.weightQ8_0[4096 16384]
-
blk.4.ffn_up.biasF32[16384]
-
blk.4.ffn_down.weightQ8_0[16384 4096]
-
blk.4.ffn_down.biasF32[4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_norm.biasF32[4096]
-
blk.5.attn_qkv.weightQ8_0[4096 4352]
-
blk.5.attn_qkv.biasF32[4352]
-
blk.5.attn_output.weightQ8_0[4096 4096]
-
blk.5.attn_output.biasF32[4096]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_norm.biasF32[4096]
-
blk.5.ffn_up.weightQ8_0[4096 16384]
-
blk.5.ffn_up.biasF32[16384]
-
blk.5.ffn_down.weightQ8_0[16384 4096]
-
blk.5.ffn_down.biasF32[4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_norm.biasF32[4096]
-
blk.6.attn_qkv.weightQ8_0[4096 4352]
-
blk.6.attn_qkv.biasF32[4352]
-
blk.6.attn_output.weightQ8_0[4096 4096]
-
blk.6.attn_output.biasF32[4096]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_norm.biasF32[4096]
-
blk.6.ffn_up.weightQ8_0[4096 16384]
-
blk.6.ffn_up.biasF32[16384]
-
blk.6.ffn_down.weightQ8_0[16384 4096]
-
blk.6.ffn_down.biasF32[4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_norm.biasF32[4096]
-
blk.7.attn_qkv.weightQ8_0[4096 4352]
-
blk.7.attn_qkv.biasF32[4352]
-
blk.7.attn_output.weightQ8_0[4096 4096]
-
blk.7.attn_output.biasF32[4096]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_norm.biasF32[4096]
-
blk.7.ffn_up.weightQ8_0[4096 16384]
-
blk.7.ffn_up.biasF32[16384]
-
blk.7.ffn_down.weightQ8_0[16384 4096]
-
blk.7.ffn_down.biasF32[4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_norm.biasF32[4096]
-
blk.8.attn_qkv.weightQ8_0[4096 4352]
-
blk.8.attn_qkv.biasF32[4352]
-
blk.8.attn_output.weightQ8_0[4096 4096]
-
blk.8.attn_output.biasF32[4096]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_norm.biasF32[4096]
-
blk.8.ffn_up.weightQ8_0[4096 16384]
-
blk.8.ffn_up.biasF32[16384]
-
blk.8.ffn_down.weightQ8_0[16384 4096]
-
blk.8.ffn_down.biasF32[4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_norm.biasF32[4096]
-
blk.9.attn_qkv.weightQ8_0[4096 4352]
-
blk.9.attn_qkv.biasF32[4352]
-
blk.9.attn_output.weightQ8_0[4096 4096]
-
blk.9.attn_output.biasF32[4096]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_norm.biasF32[4096]
-
blk.9.ffn_up.weightQ8_0[4096 16384]
-
blk.9.ffn_up.biasF32[16384]
-
blk.9.ffn_down.weightQ8_0[16384 4096]
-
blk.9.ffn_down.biasF32[4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_norm.biasF32[4096]
-
blk.10.attn_qkv.weightQ8_0[4096 4352]
-
blk.10.attn_qkv.biasF32[4352]
-
blk.10.attn_output.weightQ8_0[4096 4096]
-
blk.10.attn_output.biasF32[4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_norm.biasF32[4096]
-
blk.10.ffn_up.weightQ8_0[4096 16384]
-
blk.10.ffn_up.biasF32[16384]
-
blk.10.ffn_down.weightQ8_0[16384 4096]
-
blk.10.ffn_down.biasF32[4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_norm.biasF32[4096]
-
blk.11.attn_qkv.weightQ8_0[4096 4352]
-
blk.11.attn_qkv.biasF32[4352]
-
blk.11.attn_output.weightQ8_0[4096 4096]
-
blk.11.attn_output.biasF32[4096]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_norm.biasF32[4096]
-
blk.11.ffn_up.weightQ8_0[4096 16384]
-
blk.11.ffn_up.biasF32[16384]
-
blk.11.ffn_down.weightQ8_0[16384 4096]
-
blk.11.ffn_down.biasF32[4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_norm.biasF32[4096]
-
blk.12.attn_qkv.weightQ8_0[4096 4352]
-
blk.12.attn_qkv.biasF32[4352]
-
blk.12.attn_output.weightQ8_0[4096 4096]
-
blk.12.attn_output.biasF32[4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_norm.biasF32[4096]
-
blk.12.ffn_up.weightQ8_0[4096 16384]
-
blk.12.ffn_up.biasF32[16384]
-
blk.12.ffn_down.weightQ8_0[16384 4096]
-
blk.12.ffn_down.biasF32[4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_norm.biasF32[4096]
-
blk.13.attn_qkv.weightQ8_0[4096 4352]
-
blk.13.attn_qkv.biasF32[4352]
-
blk.13.attn_output.weightQ8_0[4096 4096]
-
blk.13.attn_output.biasF32[4096]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_norm.biasF32[4096]
-
blk.13.ffn_up.weightQ8_0[4096 16384]
-
blk.13.ffn_up.biasF32[16384]
-
blk.13.ffn_down.weightQ8_0[16384 4096]
-
blk.13.ffn_down.biasF32[4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_norm.biasF32[4096]
-
blk.14.attn_qkv.weightQ8_0[4096 4352]
-
blk.14.attn_qkv.biasF32[4352]
-
blk.14.attn_output.weightQ8_0[4096 4096]
-
blk.14.attn_output.biasF32[4096]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_norm.biasF32[4096]
-
blk.14.ffn_up.weightQ8_0[4096 16384]
-
blk.14.ffn_up.biasF32[16384]
-
blk.14.ffn_down.weightQ8_0[16384 4096]
-
blk.14.ffn_down.biasF32[4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_norm.biasF32[4096]
-
blk.15.attn_qkv.weightQ8_0[4096 4352]
-
blk.15.attn_qkv.biasF32[4352]
-
blk.15.attn_output.weightQ8_0[4096 4096]
-
blk.15.attn_output.biasF32[4096]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_norm.biasF32[4096]
-
blk.15.ffn_up.weightQ8_0[4096 16384]
-
blk.15.ffn_up.biasF32[16384]
-
blk.15.ffn_down.weightQ8_0[16384 4096]
-
blk.15.ffn_down.biasF32[4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_norm.biasF32[4096]
-
blk.16.attn_qkv.weightQ8_0[4096 4352]
-
blk.16.attn_qkv.biasF32[4352]
-
blk.16.attn_output.weightQ8_0[4096 4096]
-
blk.16.attn_output.biasF32[4096]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_norm.biasF32[4096]
-
blk.16.ffn_up.weightQ8_0[4096 16384]
-
blk.16.ffn_up.biasF32[16384]
-
blk.16.ffn_down.weightQ8_0[16384 4096]
-
blk.16.ffn_down.biasF32[4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_norm.biasF32[4096]
-
blk.17.attn_qkv.weightQ8_0[4096 4352]
-
blk.17.attn_qkv.biasF32[4352]
-
blk.17.attn_output.weightQ8_0[4096 4096]
-
blk.17.attn_output.biasF32[4096]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_norm.biasF32[4096]
-
blk.17.ffn_up.weightQ8_0[4096 16384]
-
blk.17.ffn_up.biasF32[16384]
-
blk.17.ffn_down.weightQ8_0[16384 4096]
-
blk.17.ffn_down.biasF32[4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_norm.biasF32[4096]
-
blk.18.attn_qkv.weightQ8_0[4096 4352]
-
blk.18.attn_qkv.biasF32[4352]
-
blk.18.attn_output.weightQ8_0[4096 4096]
-
blk.18.attn_output.biasF32[4096]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_norm.biasF32[4096]
-
blk.18.ffn_up.weightQ8_0[4096 16384]
-
blk.18.ffn_up.biasF32[16384]
-
blk.18.ffn_down.weightQ8_0[16384 4096]
-
blk.18.ffn_down.biasF32[4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_norm.biasF32[4096]
-
blk.19.attn_qkv.weightQ8_0[4096 4352]
-
blk.19.attn_qkv.biasF32[4352]
-
blk.19.attn_output.weightQ8_0[4096 4096]
-
blk.19.attn_output.biasF32[4096]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_norm.biasF32[4096]
-
blk.19.ffn_up.weightQ8_0[4096 16384]
-
blk.19.ffn_up.biasF32[16384]
-
blk.19.ffn_down.weightQ8_0[16384 4096]
-
blk.19.ffn_down.biasF32[4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_norm.biasF32[4096]
-
blk.20.attn_qkv.weightQ8_0[4096 4352]
-
blk.20.attn_qkv.biasF32[4352]
-
blk.20.attn_output.weightQ8_0[4096 4096]
-
blk.20.attn_output.biasF32[4096]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_norm.biasF32[4096]
-
blk.20.ffn_up.weightQ8_0[4096 16384]
-
blk.20.ffn_up.biasF32[16384]
-
blk.20.ffn_down.weightQ8_0[16384 4096]
-
blk.20.ffn_down.biasF32[4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_norm.biasF32[4096]
-
blk.21.attn_qkv.weightQ8_0[4096 4352]
-
blk.21.attn_qkv.biasF32[4352]
-
blk.21.attn_output.weightQ8_0[4096 4096]
-
blk.21.attn_output.biasF32[4096]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_norm.biasF32[4096]
-
blk.21.ffn_up.weightQ8_0[4096 16384]
-
blk.21.ffn_up.biasF32[16384]
-
blk.21.ffn_down.weightQ8_0[16384 4096]
-
blk.21.ffn_down.biasF32[4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_norm.biasF32[4096]
-
blk.22.attn_qkv.weightQ8_0[4096 4352]
-
blk.22.attn_qkv.biasF32[4352]
-
blk.22.attn_output.weightQ8_0[4096 4096]
-
blk.22.attn_output.biasF32[4096]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_norm.biasF32[4096]
-
blk.22.ffn_up.weightQ8_0[4096 16384]
-
blk.22.ffn_up.biasF32[16384]
-
blk.22.ffn_down.weightQ8_0[16384 4096]
-
blk.22.ffn_down.biasF32[4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_norm.biasF32[4096]
-
blk.23.attn_qkv.weightQ8_0[4096 4352]
-
blk.23.attn_qkv.biasF32[4352]
-
blk.23.attn_output.weightQ8_0[4096 4096]
-
blk.23.attn_output.biasF32[4096]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_norm.biasF32[4096]
-
blk.23.ffn_up.weightQ8_0[4096 16384]
-
blk.23.ffn_up.biasF32[16384]
-
blk.23.ffn_down.weightQ8_0[16384 4096]
-
blk.23.ffn_down.biasF32[4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_norm.biasF32[4096]
-
blk.24.attn_qkv.weightQ8_0[4096 4352]
-
blk.24.attn_qkv.biasF32[4352]
-
blk.24.attn_output.weightQ8_0[4096 4096]
-
blk.24.attn_output.biasF32[4096]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_norm.biasF32[4096]
-
blk.24.ffn_up.weightQ8_0[4096 16384]
-
blk.24.ffn_up.biasF32[16384]
-
blk.24.ffn_down.weightQ8_0[16384 4096]
-
blk.24.ffn_down.biasF32[4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_norm.biasF32[4096]
-
blk.25.attn_qkv.weightQ8_0[4096 4352]
-
blk.25.attn_qkv.biasF32[4352]
-
blk.25.attn_output.weightQ8_0[4096 4096]
-
blk.25.attn_output.biasF32[4096]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_norm.biasF32[4096]
-
blk.25.ffn_up.weightQ8_0[4096 16384]
-
blk.25.ffn_up.biasF32[16384]
-
blk.25.ffn_down.weightQ8_0[16384 4096]
-
blk.25.ffn_down.biasF32[4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_norm.biasF32[4096]
-
blk.26.attn_qkv.weightQ8_0[4096 4352]
-
blk.26.attn_qkv.biasF32[4352]
-
blk.26.attn_output.weightQ8_0[4096 4096]
-
blk.26.attn_output.biasF32[4096]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_norm.biasF32[4096]
-
blk.26.ffn_up.weightQ8_0[4096 16384]
-
blk.26.ffn_up.biasF32[16384]
-
blk.26.ffn_down.weightQ8_0[16384 4096]
-
blk.26.ffn_down.biasF32[4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_norm.biasF32[4096]
-
blk.27.attn_qkv.weightQ8_0[4096 4352]
-
blk.27.attn_qkv.biasF32[4352]
-
blk.27.attn_output.weightQ8_0[4096 4096]
-
blk.27.attn_output.biasF32[4096]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_norm.biasF32[4096]
-
blk.27.ffn_up.weightQ8_0[4096 16384]
-
blk.27.ffn_up.biasF32[16384]
-
blk.27.ffn_down.weightQ8_0[16384 4096]
-
blk.27.ffn_down.biasF32[4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_norm.biasF32[4096]
-
blk.28.attn_qkv.weightQ8_0[4096 4352]
-
blk.28.attn_qkv.biasF32[4352]
-
blk.28.attn_output.weightQ8_0[4096 4096]
-
blk.28.attn_output.biasF32[4096]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_norm.biasF32[4096]
-
blk.28.ffn_up.weightQ8_0[4096 16384]
-
blk.28.ffn_up.biasF32[16384]
-
blk.28.ffn_down.weightQ8_0[16384 4096]
-
blk.28.ffn_down.biasF32[4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_norm.biasF32[4096]
-
blk.29.attn_qkv.weightQ8_0[4096 4352]
-
blk.29.attn_qkv.biasF32[4352]
-
blk.29.attn_output.weightQ8_0[4096 4096]
-
blk.29.attn_output.biasF32[4096]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_norm.biasF32[4096]
-
blk.29.ffn_up.weightQ8_0[4096 16384]
-
blk.29.ffn_up.biasF32[16384]
-
blk.29.ffn_down.weightQ8_0[16384 4096]
-
blk.29.ffn_down.biasF32[4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_norm.biasF32[4096]
-
blk.30.attn_qkv.weightQ8_0[4096 4352]
-
blk.30.attn_qkv.biasF32[4352]
-
blk.30.attn_output.weightQ8_0[4096 4096]
-
blk.30.attn_output.biasF32[4096]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_norm.biasF32[4096]
-
blk.30.ffn_up.weightQ8_0[4096 16384]
-
blk.30.ffn_up.biasF32[16384]
-
blk.30.ffn_down.weightQ8_0[16384 4096]
-
blk.30.ffn_down.biasF32[4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_norm.biasF32[4096]
-
blk.31.attn_qkv.weightQ8_0[4096 4352]
-
blk.31.attn_qkv.biasF32[4352]
-
blk.31.attn_output.weightQ8_0[4096 4096]
-
blk.31.attn_output.biasF32[4096]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_norm.biasF32[4096]
-
blk.31.ffn_up.weightQ8_0[4096 16384]
-
blk.31.ffn_up.biasF32[16384]
-
blk.31.ffn_down.weightQ8_0[16384 4096]
-
blk.31.ffn_down.biasF32[4096]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_norm.biasF32[4096]
-
blk.32.attn_qkv.weightQ8_0[4096 4352]
-
blk.32.attn_qkv.biasF32[4352]
-
blk.32.attn_output.weightQ8_0[4096 4096]
-
blk.32.attn_output.biasF32[4096]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_norm.biasF32[4096]
-
blk.32.ffn_up.weightQ8_0[4096 16384]
-
blk.32.ffn_up.biasF32[16384]
-
blk.32.ffn_down.weightQ8_0[16384 4096]
-
blk.32.ffn_down.biasF32[4096]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_norm.biasF32[4096]
-
blk.33.attn_qkv.weightQ8_0[4096 4352]
-
blk.33.attn_qkv.biasF32[4352]
-
blk.33.attn_output.weightQ8_0[4096 4096]
-
blk.33.attn_output.biasF32[4096]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_norm.biasF32[4096]
-
blk.33.ffn_up.weightQ8_0[4096 16384]
-
blk.33.ffn_up.biasF32[16384]
-
blk.33.ffn_down.weightQ8_0[16384 4096]
-
blk.33.ffn_down.biasF32[4096]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_norm.biasF32[4096]
-
blk.34.attn_qkv.weightQ8_0[4096 4352]
-
blk.34.attn_qkv.biasF32[4352]
-
blk.34.attn_output.weightQ8_0[4096 4096]
-
blk.34.attn_output.biasF32[4096]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_norm.biasF32[4096]
-
blk.34.ffn_up.weightQ8_0[4096 16384]
-
blk.34.ffn_up.biasF32[16384]
-
blk.34.ffn_down.weightQ8_0[16384 4096]
-
blk.34.ffn_down.biasF32[4096]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_norm.biasF32[4096]
-
blk.35.attn_qkv.weightQ8_0[4096 4352]
-
blk.35.attn_qkv.biasF32[4352]
-
blk.35.attn_output.weightQ8_0[4096 4096]
-
blk.35.attn_output.biasF32[4096]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_norm.biasF32[4096]
-
blk.35.ffn_up.weightQ8_0[4096 16384]
-
blk.35.ffn_up.biasF32[16384]
-
blk.35.ffn_down.weightQ8_0[16384 4096]
-
blk.35.ffn_down.biasF32[4096]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_norm.biasF32[4096]
-
blk.36.attn_qkv.weightQ8_0[4096 4352]
-
blk.36.attn_qkv.biasF32[4352]
-
blk.36.attn_output.weightQ8_0[4096 4096]
-
blk.36.attn_output.biasF32[4096]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_norm.biasF32[4096]
-
blk.36.ffn_up.weightQ8_0[4096 16384]
-
blk.36.ffn_up.biasF32[16384]
-
blk.36.ffn_down.weightQ8_0[16384 4096]
-
blk.36.ffn_down.biasF32[4096]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_norm.biasF32[4096]
-
blk.37.attn_qkv.weightQ8_0[4096 4352]
-
blk.37.attn_qkv.biasF32[4352]
-
blk.37.attn_output.weightQ8_0[4096 4096]
-
blk.37.attn_output.biasF32[4096]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_norm.biasF32[4096]
-
blk.37.ffn_up.weightQ8_0[4096 16384]
-
blk.37.ffn_up.biasF32[16384]
-
blk.37.ffn_down.weightQ8_0[16384 4096]
-
blk.37.ffn_down.biasF32[4096]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_norm.biasF32[4096]
-
blk.38.attn_qkv.weightQ8_0[4096 4352]
-
blk.38.attn_qkv.biasF32[4352]
-
blk.38.attn_output.weightQ8_0[4096 4096]
-
blk.38.attn_output.biasF32[4096]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_norm.biasF32[4096]
-
blk.38.ffn_up.weightQ8_0[4096 16384]
-
blk.38.ffn_up.biasF32[16384]
-
blk.38.ffn_down.weightQ8_0[16384 4096]
-
blk.38.ffn_down.biasF32[4096]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_norm.biasF32[4096]
-
blk.39.attn_qkv.weightQ8_0[4096 4352]
-
blk.39.attn_qkv.biasF32[4352]
-
blk.39.attn_output.weightQ8_0[4096 4096]
-
blk.39.attn_output.biasF32[4096]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_norm.biasF32[4096]
-
blk.39.ffn_up.weightQ8_0[4096 16384]
-
blk.39.ffn_up.biasF32[16384]
-
blk.39.ffn_down.weightQ8_0[16384 4096]
-
blk.39.ffn_down.biasF32[4096]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_norm.biasF32[4096]
-
blk.40.attn_qkv.weightQ8_0[4096 4352]
-
blk.40.attn_qkv.biasF32[4352]
-
blk.40.attn_output.weightQ8_0[4096 4096]
-
blk.40.attn_output.biasF32[4096]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_norm.biasF32[4096]
-
blk.40.ffn_up.weightQ8_0[4096 16384]
-
blk.40.ffn_up.biasF32[16384]
-
blk.40.ffn_down.weightQ8_0[16384 4096]
-
blk.40.ffn_down.biasF32[4096]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_norm.biasF32[4096]
-
blk.41.attn_qkv.weightQ8_0[4096 4352]
-
blk.41.attn_qkv.biasF32[4352]
-
blk.41.attn_output.weightQ8_0[4096 4096]
-
blk.41.attn_output.biasF32[4096]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_norm.biasF32[4096]
-
blk.41.ffn_up.weightQ8_0[4096 16384]
-
blk.41.ffn_up.biasF32[16384]
-
blk.41.ffn_down.weightQ8_0[16384 4096]
-
blk.41.ffn_down.biasF32[4096]
-
output.weightQ8_0[4096 49152]
-
output_norm.weightF32[4096]
-
output_norm.biasF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41