latest
1.7GB
3B
12 Pulls Updated 3 weeks ago
28bfdfaeba9f · 1.7GB
-
general.architecturestarcoder2
-
general.file_typeQ4_0
-
starcoder2.attention.head_count24
-
starcoder2.attention.head_count_kv2
-
starcoder2.attention.layer_norm_epsilon1e-05
-
starcoder2.block_count30
-
starcoder2.context_length16384
-
starcoder2.embedding_length3072
-
starcoder2.feed_forward_length12288
-
starcoder2.rope.freq_base999999.44
-
tokenizer.ggml.bos_token_id0
-
tokenizer.ggml.eos_token_id0
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ ĠĠĠĠ ĠĠĠĠ ĠĠ Ġ e r ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<|endoftext|> <fim_prefix> <fim_middle> <fim_suffix> <fim_pad> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_0[3072 49152]
-
blk.0.attn_norm.biasF32[3072]
-
blk.0.attn_norm.weightF32[3072]
-
blk.0.ffn_up.biasF32[12288]
-
blk.0.ffn_up.weightQ4_0[3072 12288]
-
blk.0.ffn_down.biasF32[3072]
-
blk.0.ffn_down.weightQ4_0[12288 3072]
-
blk.0.ffn_norm.biasF32[3072]
-
blk.0.ffn_norm.weightF32[3072]
-
blk.0.attn_k.biasF32[256]
-
blk.0.attn_k.weightQ4_0[3072 256]
-
blk.0.attn_output.biasF32[3072]
-
blk.0.attn_output.weightQ4_0[3072 3072]
-
blk.0.attn_q.biasF32[3072]
-
blk.0.attn_q.weightQ4_0[3072 3072]
-
blk.0.attn_v.biasF32[256]
-
blk.0.attn_v.weightQ4_0[3072 256]
-
blk.1.attn_norm.biasF32[3072]
-
blk.1.attn_norm.weightF32[3072]
-
blk.1.ffn_up.biasF32[12288]
-
blk.1.ffn_up.weightQ4_0[3072 12288]
-
blk.1.ffn_down.biasF32[3072]
-
blk.1.ffn_down.weightQ4_0[12288 3072]
-
blk.1.ffn_norm.biasF32[3072]
-
blk.1.ffn_norm.weightF32[3072]
-
blk.1.attn_k.biasF32[256]
-
blk.1.attn_k.weightQ4_0[3072 256]
-
blk.1.attn_output.biasF32[3072]
-
blk.1.attn_output.weightQ4_0[3072 3072]
-
blk.1.attn_q.biasF32[3072]
-
blk.1.attn_q.weightQ4_0[3072 3072]
-
blk.1.attn_v.biasF32[256]
-
blk.1.attn_v.weightQ4_0[3072 256]
-
blk.2.attn_norm.biasF32[3072]
-
blk.2.attn_norm.weightF32[3072]
-
blk.2.ffn_up.biasF32[12288]
-
blk.2.ffn_up.weightQ4_0[3072 12288]
-
blk.2.ffn_down.biasF32[3072]
-
blk.2.ffn_down.weightQ4_0[12288 3072]
-
blk.2.ffn_norm.biasF32[3072]
-
blk.2.ffn_norm.weightF32[3072]
-
blk.2.attn_k.biasF32[256]
-
blk.2.attn_k.weightQ4_0[3072 256]
-
blk.2.attn_output.biasF32[3072]
-
blk.2.attn_output.weightQ4_0[3072 3072]
-
blk.2.attn_q.biasF32[3072]
-
blk.2.attn_q.weightQ4_0[3072 3072]
-
blk.2.attn_v.biasF32[256]
-
blk.2.attn_v.weightQ4_0[3072 256]
-
blk.3.attn_norm.biasF32[3072]
-
blk.3.attn_norm.weightF32[3072]
-
blk.3.ffn_up.biasF32[12288]
-
blk.3.ffn_up.weightQ4_0[3072 12288]
-
blk.3.ffn_down.biasF32[3072]
-
blk.3.ffn_down.weightQ4_0[12288 3072]
-
blk.3.ffn_norm.biasF32[3072]
-
blk.3.ffn_norm.weightF32[3072]
-
blk.3.attn_k.biasF32[256]
-
blk.3.attn_k.weightQ4_0[3072 256]
-
blk.3.attn_output.biasF32[3072]
-
blk.3.attn_output.weightQ4_0[3072 3072]
-
blk.3.attn_q.biasF32[3072]
-
blk.3.attn_q.weightQ4_0[3072 3072]
-
blk.3.attn_v.biasF32[256]
-
blk.3.attn_v.weightQ4_0[3072 256]
-
blk.4.attn_norm.biasF32[3072]
-
blk.4.attn_norm.weightF32[3072]
-
blk.4.ffn_up.biasF32[12288]
-
blk.4.ffn_up.weightQ4_0[3072 12288]
-
blk.4.ffn_down.biasF32[3072]
-
blk.4.ffn_down.weightQ4_0[12288 3072]
-
blk.4.ffn_norm.biasF32[3072]
-
blk.4.ffn_norm.weightF32[3072]
-
blk.4.attn_k.biasF32[256]
-
blk.4.attn_k.weightQ4_0[3072 256]
-
blk.4.attn_output.biasF32[3072]
-
blk.4.attn_output.weightQ4_0[3072 3072]
-
blk.4.attn_q.biasF32[3072]
-
blk.4.attn_q.weightQ4_0[3072 3072]
-
blk.4.attn_v.biasF32[256]
-
blk.4.attn_v.weightQ4_0[3072 256]
-
blk.5.attn_norm.biasF32[3072]
-
blk.5.attn_norm.weightF32[3072]
-
blk.5.ffn_up.biasF32[12288]
-
blk.5.ffn_up.weightQ4_0[3072 12288]
-
blk.5.ffn_down.biasF32[3072]
-
blk.5.ffn_down.weightQ4_0[12288 3072]
-
blk.5.ffn_norm.biasF32[3072]
-
blk.5.ffn_norm.weightF32[3072]
-
blk.5.attn_k.biasF32[256]
-
blk.5.attn_k.weightQ4_0[3072 256]
-
blk.5.attn_output.biasF32[3072]
-
blk.5.attn_output.weightQ4_0[3072 3072]
-
blk.5.attn_q.biasF32[3072]
-
blk.5.attn_q.weightQ4_0[3072 3072]
-
blk.5.attn_v.biasF32[256]
-
blk.5.attn_v.weightQ4_0[3072 256]
-
blk.6.attn_norm.biasF32[3072]
-
blk.6.attn_norm.weightF32[3072]
-
blk.6.ffn_up.biasF32[12288]
-
blk.6.ffn_up.weightQ4_0[3072 12288]
-
blk.6.ffn_down.biasF32[3072]
-
blk.6.ffn_down.weightQ4_0[12288 3072]
-
blk.6.ffn_norm.biasF32[3072]
-
blk.6.ffn_norm.weightF32[3072]
-
blk.6.attn_k.biasF32[256]
-
blk.6.attn_k.weightQ4_0[3072 256]
-
blk.6.attn_output.biasF32[3072]
-
blk.6.attn_output.weightQ4_0[3072 3072]
-
blk.6.attn_q.biasF32[3072]
-
blk.6.attn_q.weightQ4_0[3072 3072]
-
blk.6.attn_v.biasF32[256]
-
blk.6.attn_v.weightQ4_0[3072 256]
-
blk.7.attn_norm.biasF32[3072]
-
blk.7.attn_norm.weightF32[3072]
-
blk.7.ffn_up.biasF32[12288]
-
blk.7.ffn_up.weightQ4_0[3072 12288]
-
blk.7.ffn_down.biasF32[3072]
-
blk.7.ffn_down.weightQ4_0[12288 3072]
-
blk.7.ffn_norm.biasF32[3072]
-
blk.7.ffn_norm.weightF32[3072]
-
blk.7.attn_k.biasF32[256]
-
blk.7.attn_k.weightQ4_0[3072 256]
-
blk.7.attn_output.biasF32[3072]
-
blk.7.attn_output.weightQ4_0[3072 3072]
-
blk.7.attn_q.biasF32[3072]
-
blk.7.attn_q.weightQ4_0[3072 3072]
-
blk.7.attn_v.biasF32[256]
-
blk.7.attn_v.weightQ4_0[3072 256]
-
blk.8.attn_norm.biasF32[3072]
-
blk.8.attn_norm.weightF32[3072]
-
blk.8.ffn_up.biasF32[12288]
-
blk.8.ffn_up.weightQ4_0[3072 12288]
-
blk.8.ffn_down.biasF32[3072]
-
blk.8.ffn_down.weightQ4_0[12288 3072]
-
blk.8.ffn_norm.biasF32[3072]
-
blk.8.ffn_norm.weightF32[3072]
-
blk.8.attn_k.biasF32[256]
-
blk.8.attn_k.weightQ4_0[3072 256]
-
blk.8.attn_output.biasF32[3072]
-
blk.8.attn_output.weightQ4_0[3072 3072]
-
blk.8.attn_q.biasF32[3072]
-
blk.8.attn_q.weightQ4_0[3072 3072]
-
blk.8.attn_v.biasF32[256]
-
blk.8.attn_v.weightQ4_0[3072 256]
-
blk.9.attn_norm.biasF32[3072]
-
blk.9.attn_norm.weightF32[3072]
-
blk.9.ffn_up.biasF32[12288]
-
blk.9.ffn_up.weightQ4_0[3072 12288]
-
blk.9.ffn_down.biasF32[3072]
-
blk.9.ffn_down.weightQ4_0[12288 3072]
-
blk.9.ffn_norm.biasF32[3072]
-
blk.9.ffn_norm.weightF32[3072]
-
blk.9.attn_k.biasF32[256]
-
blk.9.attn_k.weightQ4_0[3072 256]
-
blk.9.attn_output.biasF32[3072]
-
blk.9.attn_output.weightQ4_0[3072 3072]
-
blk.9.attn_q.biasF32[3072]
-
blk.9.attn_q.weightQ4_0[3072 3072]
-
blk.9.attn_v.biasF32[256]
-
blk.9.attn_v.weightQ4_0[3072 256]
-
blk.10.attn_norm.biasF32[3072]
-
blk.10.attn_norm.weightF32[3072]
-
blk.10.ffn_up.biasF32[12288]
-
blk.10.ffn_up.weightQ4_0[3072 12288]
-
blk.10.ffn_down.biasF32[3072]
-
blk.10.ffn_down.weightQ4_0[12288 3072]
-
blk.10.ffn_norm.biasF32[3072]
-
blk.10.ffn_norm.weightF32[3072]
-
blk.10.attn_k.biasF32[256]
-
blk.10.attn_k.weightQ4_0[3072 256]
-
blk.10.attn_output.biasF32[3072]
-
blk.10.attn_output.weightQ4_0[3072 3072]
-
blk.10.attn_q.biasF32[3072]
-
blk.10.attn_q.weightQ4_0[3072 3072]
-
blk.10.attn_v.biasF32[256]
-
blk.10.attn_v.weightQ4_0[3072 256]
-
blk.11.attn_norm.biasF32[3072]
-
blk.11.attn_norm.weightF32[3072]
-
blk.11.ffn_up.biasF32[12288]
-
blk.11.ffn_up.weightQ4_0[3072 12288]
-
blk.11.ffn_down.biasF32[3072]
-
blk.11.ffn_down.weightQ4_0[12288 3072]
-
blk.11.ffn_norm.biasF32[3072]
-
blk.11.ffn_norm.weightF32[3072]
-
blk.11.attn_k.biasF32[256]
-
blk.11.attn_k.weightQ4_0[3072 256]
-
blk.11.attn_output.biasF32[3072]
-
blk.11.attn_output.weightQ4_0[3072 3072]
-
blk.11.attn_q.biasF32[3072]
-
blk.11.attn_q.weightQ4_0[3072 3072]
-
blk.11.attn_v.biasF32[256]
-
blk.11.attn_v.weightQ4_0[3072 256]
-
blk.12.attn_norm.biasF32[3072]
-
blk.12.attn_norm.weightF32[3072]
-
blk.12.ffn_up.biasF32[12288]
-
blk.12.ffn_up.weightQ4_0[3072 12288]
-
blk.12.ffn_down.biasF32[3072]
-
blk.12.ffn_down.weightQ4_0[12288 3072]
-
blk.12.ffn_norm.biasF32[3072]
-
blk.12.ffn_norm.weightF32[3072]
-
blk.12.attn_k.biasF32[256]
-
blk.12.attn_k.weightQ4_0[3072 256]
-
blk.12.attn_output.biasF32[3072]
-
blk.12.attn_output.weightQ4_0[3072 3072]
-
blk.12.attn_q.biasF32[3072]
-
blk.12.attn_q.weightQ4_0[3072 3072]
-
blk.12.attn_v.biasF32[256]
-
blk.12.attn_v.weightQ4_0[3072 256]
-
blk.13.attn_norm.biasF32[3072]
-
blk.13.attn_norm.weightF32[3072]
-
blk.13.ffn_up.biasF32[12288]
-
blk.13.ffn_up.weightQ4_0[3072 12288]
-
blk.13.ffn_down.biasF32[3072]
-
blk.13.ffn_down.weightQ4_0[12288 3072]
-
blk.13.ffn_norm.biasF32[3072]
-
blk.13.ffn_norm.weightF32[3072]
-
blk.13.attn_k.biasF32[256]
-
blk.13.attn_k.weightQ4_0[3072 256]
-
blk.13.attn_output.biasF32[3072]
-
blk.13.attn_output.weightQ4_0[3072 3072]
-
blk.13.attn_q.biasF32[3072]
-
blk.13.attn_q.weightQ4_0[3072 3072]
-
blk.13.attn_v.biasF32[256]
-
blk.13.attn_v.weightQ4_0[3072 256]
-
blk.14.attn_norm.biasF32[3072]
-
blk.14.attn_norm.weightF32[3072]
-
blk.14.ffn_up.biasF32[12288]
-
blk.14.ffn_up.weightQ4_0[3072 12288]
-
blk.14.ffn_down.biasF32[3072]
-
blk.14.ffn_down.weightQ4_0[12288 3072]
-
blk.14.ffn_norm.biasF32[3072]
-
blk.14.ffn_norm.weightF32[3072]
-
blk.14.attn_k.biasF32[256]
-
blk.14.attn_k.weightQ4_0[3072 256]
-
blk.14.attn_output.biasF32[3072]
-
blk.14.attn_output.weightQ4_0[3072 3072]
-
blk.14.attn_q.biasF32[3072]
-
blk.14.attn_q.weightQ4_0[3072 3072]
-
blk.14.attn_v.biasF32[256]
-
blk.14.attn_v.weightQ4_0[3072 256]
-
blk.15.attn_norm.biasF32[3072]
-
blk.15.attn_norm.weightF32[3072]
-
blk.15.ffn_up.biasF32[12288]
-
blk.15.ffn_up.weightQ4_0[3072 12288]
-
blk.15.ffn_down.biasF32[3072]
-
blk.15.ffn_down.weightQ4_0[12288 3072]
-
blk.15.ffn_norm.biasF32[3072]
-
blk.15.ffn_norm.weightF32[3072]
-
blk.15.attn_k.biasF32[256]
-
blk.15.attn_k.weightQ4_0[3072 256]
-
blk.15.attn_output.biasF32[3072]
-
blk.15.attn_output.weightQ4_0[3072 3072]
-
blk.15.attn_q.biasF32[3072]
-
blk.15.attn_q.weightQ4_0[3072 3072]
-
blk.15.attn_v.biasF32[256]
-
blk.15.attn_v.weightQ4_0[3072 256]
-
blk.16.attn_norm.biasF32[3072]
-
blk.16.attn_norm.weightF32[3072]
-
blk.16.ffn_up.biasF32[12288]
-
blk.16.ffn_up.weightQ4_0[3072 12288]
-
blk.16.ffn_down.biasF32[3072]
-
blk.16.ffn_down.weightQ4_0[12288 3072]
-
blk.16.ffn_norm.biasF32[3072]
-
blk.16.ffn_norm.weightF32[3072]
-
blk.16.attn_k.biasF32[256]
-
blk.16.attn_k.weightQ4_0[3072 256]
-
blk.16.attn_output.biasF32[3072]
-
blk.16.attn_output.weightQ4_0[3072 3072]
-
blk.16.attn_q.biasF32[3072]
-
blk.16.attn_q.weightQ4_0[3072 3072]
-
blk.16.attn_v.biasF32[256]
-
blk.16.attn_v.weightQ4_0[3072 256]
-
blk.17.attn_norm.biasF32[3072]
-
blk.17.attn_norm.weightF32[3072]
-
blk.17.ffn_up.biasF32[12288]
-
blk.17.ffn_up.weightQ4_0[3072 12288]
-
blk.17.ffn_down.biasF32[3072]
-
blk.17.ffn_down.weightQ4_0[12288 3072]
-
blk.17.ffn_norm.biasF32[3072]
-
blk.17.ffn_norm.weightF32[3072]
-
blk.17.attn_k.biasF32[256]
-
blk.17.attn_k.weightQ4_0[3072 256]
-
blk.17.attn_output.biasF32[3072]
-
blk.17.attn_output.weightQ4_0[3072 3072]
-
blk.17.attn_q.biasF32[3072]
-
blk.17.attn_q.weightQ4_0[3072 3072]
-
blk.17.attn_v.biasF32[256]
-
blk.17.attn_v.weightQ4_0[3072 256]
-
blk.18.attn_norm.biasF32[3072]
-
blk.18.attn_norm.weightF32[3072]
-
blk.18.ffn_up.biasF32[12288]
-
blk.18.ffn_up.weightQ4_0[3072 12288]
-
blk.18.ffn_down.biasF32[3072]
-
blk.18.ffn_down.weightQ4_0[12288 3072]
-
blk.18.ffn_norm.biasF32[3072]
-
blk.18.ffn_norm.weightF32[3072]
-
blk.18.attn_k.biasF32[256]
-
blk.18.attn_k.weightQ4_0[3072 256]
-
blk.18.attn_output.biasF32[3072]
-
blk.18.attn_output.weightQ4_0[3072 3072]
-
blk.18.attn_q.biasF32[3072]
-
blk.18.attn_q.weightQ4_0[3072 3072]
-
blk.18.attn_v.biasF32[256]
-
blk.18.attn_v.weightQ4_0[3072 256]
-
blk.19.attn_norm.biasF32[3072]
-
blk.19.attn_norm.weightF32[3072]
-
blk.19.ffn_up.biasF32[12288]
-
blk.19.ffn_up.weightQ4_0[3072 12288]
-
blk.19.ffn_down.biasF32[3072]
-
blk.19.ffn_down.weightQ4_0[12288 3072]
-
blk.19.ffn_norm.biasF32[3072]
-
blk.19.ffn_norm.weightF32[3072]
-
blk.19.attn_k.biasF32[256]
-
blk.19.attn_k.weightQ4_0[3072 256]
-
blk.19.attn_output.biasF32[3072]
-
blk.19.attn_output.weightQ4_0[3072 3072]
-
blk.19.attn_q.biasF32[3072]
-
blk.19.attn_q.weightQ4_0[3072 3072]
-
blk.19.attn_v.biasF32[256]
-
blk.19.attn_v.weightQ4_0[3072 256]
-
blk.20.attn_norm.biasF32[3072]
-
blk.20.attn_norm.weightF32[3072]
-
blk.20.ffn_up.biasF32[12288]
-
blk.20.ffn_up.weightQ4_0[3072 12288]
-
blk.20.ffn_down.biasF32[3072]
-
blk.20.ffn_down.weightQ4_0[12288 3072]
-
blk.20.ffn_norm.biasF32[3072]
-
blk.20.ffn_norm.weightF32[3072]
-
blk.20.attn_k.biasF32[256]
-
blk.20.attn_k.weightQ4_0[3072 256]
-
blk.20.attn_output.biasF32[3072]
-
blk.20.attn_output.weightQ4_0[3072 3072]
-
blk.20.attn_q.biasF32[3072]
-
blk.20.attn_q.weightQ4_0[3072 3072]
-
blk.20.attn_v.biasF32[256]
-
blk.20.attn_v.weightQ4_0[3072 256]
-
blk.21.attn_norm.biasF32[3072]
-
blk.21.attn_norm.weightF32[3072]
-
blk.21.ffn_up.biasF32[12288]
-
blk.21.ffn_up.weightQ4_0[3072 12288]
-
blk.21.ffn_down.biasF32[3072]
-
blk.21.ffn_down.weightQ4_0[12288 3072]
-
blk.21.ffn_norm.biasF32[3072]
-
blk.21.ffn_norm.weightF32[3072]
-
blk.21.attn_k.biasF32[256]
-
blk.21.attn_k.weightQ4_0[3072 256]
-
blk.21.attn_output.biasF32[3072]
-
blk.21.attn_output.weightQ4_0[3072 3072]
-
blk.21.attn_q.biasF32[3072]
-
blk.21.attn_q.weightQ4_0[3072 3072]
-
blk.21.attn_v.biasF32[256]
-
blk.21.attn_v.weightQ4_0[3072 256]
-
blk.22.attn_norm.biasF32[3072]
-
blk.22.attn_norm.weightF32[3072]
-
blk.22.ffn_up.biasF32[12288]
-
blk.22.ffn_up.weightQ4_0[3072 12288]
-
blk.22.ffn_down.biasF32[3072]
-
blk.22.ffn_down.weightQ4_0[12288 3072]
-
blk.22.ffn_norm.biasF32[3072]
-
blk.22.ffn_norm.weightF32[3072]
-
blk.22.attn_k.biasF32[256]
-
blk.22.attn_k.weightQ4_0[3072 256]
-
blk.22.attn_output.biasF32[3072]
-
blk.22.attn_output.weightQ4_0[3072 3072]
-
blk.22.attn_q.biasF32[3072]
-
blk.22.attn_q.weightQ4_0[3072 3072]
-
blk.22.attn_v.biasF32[256]
-
blk.22.attn_v.weightQ4_0[3072 256]
-
blk.23.attn_norm.biasF32[3072]
-
blk.23.attn_norm.weightF32[3072]
-
blk.23.ffn_up.biasF32[12288]
-
blk.23.ffn_up.weightQ4_0[3072 12288]
-
blk.23.ffn_down.biasF32[3072]
-
blk.23.ffn_down.weightQ4_0[12288 3072]
-
blk.23.ffn_norm.biasF32[3072]
-
blk.23.ffn_norm.weightF32[3072]
-
blk.23.attn_k.biasF32[256]
-
blk.23.attn_k.weightQ4_0[3072 256]
-
blk.23.attn_output.biasF32[3072]
-
blk.23.attn_output.weightQ4_0[3072 3072]
-
blk.23.attn_q.biasF32[3072]
-
blk.23.attn_q.weightQ4_0[3072 3072]
-
blk.23.attn_v.biasF32[256]
-
blk.23.attn_v.weightQ4_0[3072 256]
-
blk.24.attn_norm.biasF32[3072]
-
blk.24.attn_norm.weightF32[3072]
-
blk.24.ffn_up.biasF32[12288]
-
blk.24.ffn_up.weightQ4_0[3072 12288]
-
blk.24.ffn_down.biasF32[3072]
-
blk.24.ffn_down.weightQ4_0[12288 3072]
-
blk.24.ffn_norm.biasF32[3072]
-
blk.24.ffn_norm.weightF32[3072]
-
blk.24.attn_k.biasF32[256]
-
blk.24.attn_k.weightQ4_0[3072 256]
-
blk.24.attn_output.biasF32[3072]
-
blk.24.attn_output.weightQ4_0[3072 3072]
-
blk.24.attn_q.biasF32[3072]
-
blk.24.attn_q.weightQ4_0[3072 3072]
-
blk.24.attn_v.biasF32[256]
-
blk.24.attn_v.weightQ4_0[3072 256]
-
blk.25.attn_norm.biasF32[3072]
-
blk.25.attn_norm.weightF32[3072]
-
blk.25.ffn_up.biasF32[12288]
-
blk.25.ffn_up.weightQ4_0[3072 12288]
-
blk.25.ffn_down.biasF32[3072]
-
blk.25.ffn_down.weightQ4_0[12288 3072]
-
blk.25.ffn_norm.biasF32[3072]
-
blk.25.ffn_norm.weightF32[3072]
-
blk.25.attn_k.biasF32[256]
-
blk.25.attn_k.weightQ4_0[3072 256]
-
blk.25.attn_output.biasF32[3072]
-
blk.25.attn_output.weightQ4_0[3072 3072]
-
blk.25.attn_q.biasF32[3072]
-
blk.25.attn_q.weightQ4_0[3072 3072]
-
blk.25.attn_v.biasF32[256]
-
blk.25.attn_v.weightQ4_0[3072 256]
-
blk.26.attn_norm.biasF32[3072]
-
blk.26.attn_norm.weightF32[3072]
-
blk.26.ffn_up.biasF32[12288]
-
blk.26.ffn_up.weightQ4_0[3072 12288]
-
blk.26.ffn_down.biasF32[3072]
-
blk.26.ffn_down.weightQ4_0[12288 3072]
-
blk.26.ffn_norm.biasF32[3072]
-
blk.26.ffn_norm.weightF32[3072]
-
blk.26.attn_k.biasF32[256]
-
blk.26.attn_k.weightQ4_0[3072 256]
-
blk.26.attn_output.biasF32[3072]
-
blk.26.attn_output.weightQ4_0[3072 3072]
-
blk.26.attn_q.biasF32[3072]
-
blk.26.attn_q.weightQ4_0[3072 3072]
-
blk.26.attn_v.biasF32[256]
-
blk.26.attn_v.weightQ4_0[3072 256]
-
blk.27.attn_norm.biasF32[3072]
-
blk.27.attn_norm.weightF32[3072]
-
blk.27.ffn_up.biasF32[12288]
-
blk.27.ffn_up.weightQ4_0[3072 12288]
-
blk.27.ffn_down.biasF32[3072]
-
blk.27.ffn_down.weightQ4_0[12288 3072]
-
blk.27.ffn_norm.biasF32[3072]
-
blk.27.ffn_norm.weightF32[3072]
-
blk.27.attn_k.biasF32[256]
-
blk.27.attn_k.weightQ4_0[3072 256]
-
blk.27.attn_output.biasF32[3072]
-
blk.27.attn_output.weightQ4_0[3072 3072]
-
blk.27.attn_q.biasF32[3072]
-
blk.27.attn_q.weightQ4_0[3072 3072]
-
blk.27.attn_v.biasF32[256]
-
blk.27.attn_v.weightQ4_0[3072 256]
-
blk.28.attn_norm.biasF32[3072]
-
blk.28.attn_norm.weightF32[3072]
-
blk.28.ffn_up.biasF32[12288]
-
blk.28.ffn_up.weightQ4_0[3072 12288]
-
blk.28.ffn_down.biasF32[3072]
-
blk.28.ffn_down.weightQ4_0[12288 3072]
-
blk.28.ffn_norm.biasF32[3072]
-
blk.28.ffn_norm.weightF32[3072]
-
blk.28.attn_k.biasF32[256]
-
blk.28.attn_k.weightQ4_0[3072 256]
-
blk.28.attn_output.biasF32[3072]
-
blk.28.attn_output.weightQ4_0[3072 3072]
-
blk.28.attn_q.biasF32[3072]
-
blk.28.attn_q.weightQ4_0[3072 3072]
-
blk.28.attn_v.biasF32[256]
-
blk.28.attn_v.weightQ4_0[3072 256]
-
blk.29.attn_norm.biasF32[3072]
-
blk.29.attn_norm.weightF32[3072]
-
blk.29.ffn_up.biasF32[12288]
-
blk.29.ffn_up.weightQ4_0[3072 12288]
-
blk.29.ffn_down.biasF32[3072]
-
blk.29.ffn_down.weightQ4_0[12288 3072]
-
blk.29.ffn_norm.biasF32[3072]
-
blk.29.ffn_norm.weightF32[3072]
-
blk.29.attn_k.biasF32[256]
-
blk.29.attn_k.weightQ4_0[3072 256]
-
blk.29.attn_output.biasF32[3072]
-
blk.29.attn_output.weightQ4_0[3072 3072]
-
blk.29.attn_q.biasF32[3072]
-
blk.29.attn_q.weightQ4_0[3072 3072]
-
blk.29.attn_v.biasF32[256]
-
blk.29.attn_v.weightQ4_0[3072 256]
-
output_norm.biasF32[3072]
-
output_norm.weightF32[3072]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29