yanolja eeve korean model
3B
207 Pulls Updated 3 months ago
2325444508d4 · 3.0GB
-
general.architecturephi2
-
general.file_typeQ8_0
-
phi2.attention.head_count32
-
phi2.attention.head_count_kv32
-
phi2.attention.layer_norm_epsilon1e-05
-
phi2.block_count32
-
phi2.context_length2048
-
phi2.embedding_length2560
-
phi2.feed_forward_length10240
-
phi2.rope.dimension_count32
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id58940
-
tokenizer.ggml.eos_token_id58943
-
tokenizer.ggml.merges[▁ ▁ ▁ ▁▁ ▁▁ ▁ ▁ ▁▁▁ ▁▁ ▁▁ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id58941
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
tokenizer.ggml.unknown_token_id50256
-
NameTypeShape
-
token_embd.weightQ8_0[2560 58944]
-
blk.0.attn_norm.biasF32[2560]
-
blk.0.attn_norm.weightF32[2560]
-
blk.0.ffn_up.biasF32[10240]
-
blk.0.ffn_up.weightQ8_0[2560 10240]
-
blk.0.ffn_down.biasF32[2560]
-
blk.0.ffn_down.weightQ8_0[10240 2560]
-
blk.0.attn_output.biasF32[2560]
-
blk.0.attn_output.weightQ8_0[2560 2560]
-
blk.0.attn_k.biasF32[2560]
-
blk.0.attn_k.weightQ8_0[2560 2560]
-
blk.0.attn_q.biasF32[2560]
-
blk.0.attn_q.weightQ8_0[2560 2560]
-
blk.0.attn_v.biasF32[2560]
-
blk.0.attn_v.weightQ8_0[2560 2560]
-
blk.1.attn_norm.biasF32[2560]
-
blk.1.attn_norm.weightF32[2560]
-
blk.1.ffn_up.biasF32[10240]
-
blk.1.ffn_up.weightQ8_0[2560 10240]
-
blk.1.ffn_down.biasF32[2560]
-
blk.1.ffn_down.weightQ8_0[10240 2560]
-
blk.1.attn_output.biasF32[2560]
-
blk.1.attn_output.weightQ8_0[2560 2560]
-
blk.1.attn_k.biasF32[2560]
-
blk.1.attn_k.weightQ8_0[2560 2560]
-
blk.1.attn_q.biasF32[2560]
-
blk.1.attn_q.weightQ8_0[2560 2560]
-
blk.1.attn_v.biasF32[2560]
-
blk.1.attn_v.weightQ8_0[2560 2560]
-
blk.2.attn_norm.biasF32[2560]
-
blk.2.attn_norm.weightF32[2560]
-
blk.2.ffn_up.biasF32[10240]
-
blk.2.ffn_up.weightQ8_0[2560 10240]
-
blk.2.ffn_down.biasF32[2560]
-
blk.2.ffn_down.weightQ8_0[10240 2560]
-
blk.2.attn_output.biasF32[2560]
-
blk.2.attn_output.weightQ8_0[2560 2560]
-
blk.2.attn_k.biasF32[2560]
-
blk.2.attn_k.weightQ8_0[2560 2560]
-
blk.2.attn_q.biasF32[2560]
-
blk.2.attn_q.weightQ8_0[2560 2560]
-
blk.2.attn_v.biasF32[2560]
-
blk.2.attn_v.weightQ8_0[2560 2560]
-
blk.3.attn_norm.biasF32[2560]
-
blk.3.attn_norm.weightF32[2560]
-
blk.3.ffn_up.biasF32[10240]
-
blk.3.ffn_up.weightQ8_0[2560 10240]
-
blk.3.ffn_down.biasF32[2560]
-
blk.3.ffn_down.weightQ8_0[10240 2560]
-
blk.3.attn_output.biasF32[2560]
-
blk.3.attn_output.weightQ8_0[2560 2560]
-
blk.3.attn_k.biasF32[2560]
-
blk.3.attn_k.weightQ8_0[2560 2560]
-
blk.3.attn_q.biasF32[2560]
-
blk.3.attn_q.weightQ8_0[2560 2560]
-
blk.3.attn_v.biasF32[2560]
-
blk.3.attn_v.weightQ8_0[2560 2560]
-
blk.4.attn_norm.biasF32[2560]
-
blk.4.attn_norm.weightF32[2560]
-
blk.4.ffn_up.biasF32[10240]
-
blk.4.ffn_up.weightQ8_0[2560 10240]
-
blk.4.ffn_down.biasF32[2560]
-
blk.4.ffn_down.weightQ8_0[10240 2560]
-
blk.4.attn_output.biasF32[2560]
-
blk.4.attn_output.weightQ8_0[2560 2560]
-
blk.4.attn_k.biasF32[2560]
-
blk.4.attn_k.weightQ8_0[2560 2560]
-
blk.4.attn_q.biasF32[2560]
-
blk.4.attn_q.weightQ8_0[2560 2560]
-
blk.4.attn_v.biasF32[2560]
-
blk.4.attn_v.weightQ8_0[2560 2560]
-
blk.5.attn_norm.biasF32[2560]
-
blk.5.attn_norm.weightF32[2560]
-
blk.5.ffn_up.biasF32[10240]
-
blk.5.ffn_up.weightQ8_0[2560 10240]
-
blk.5.ffn_down.biasF32[2560]
-
blk.5.ffn_down.weightQ8_0[10240 2560]
-
blk.5.attn_output.biasF32[2560]
-
blk.5.attn_output.weightQ8_0[2560 2560]
-
blk.5.attn_k.biasF32[2560]
-
blk.5.attn_k.weightQ8_0[2560 2560]
-
blk.5.attn_q.biasF32[2560]
-
blk.5.attn_q.weightQ8_0[2560 2560]
-
blk.5.attn_v.biasF32[2560]
-
blk.5.attn_v.weightQ8_0[2560 2560]
-
blk.6.attn_norm.biasF32[2560]
-
blk.6.attn_norm.weightF32[2560]
-
blk.6.ffn_up.biasF32[10240]
-
blk.6.ffn_up.weightQ8_0[2560 10240]
-
blk.6.ffn_down.biasF32[2560]
-
blk.6.ffn_down.weightQ8_0[10240 2560]
-
blk.6.attn_output.biasF32[2560]
-
blk.6.attn_output.weightQ8_0[2560 2560]
-
blk.6.attn_k.biasF32[2560]
-
blk.6.attn_k.weightQ8_0[2560 2560]
-
blk.6.attn_q.biasF32[2560]
-
blk.6.attn_q.weightQ8_0[2560 2560]
-
blk.6.attn_v.biasF32[2560]
-
blk.6.attn_v.weightQ8_0[2560 2560]
-
blk.7.attn_norm.biasF32[2560]
-
blk.7.attn_norm.weightF32[2560]
-
blk.7.ffn_up.biasF32[10240]
-
blk.7.ffn_up.weightQ8_0[2560 10240]
-
blk.7.ffn_down.biasF32[2560]
-
blk.7.ffn_down.weightQ8_0[10240 2560]
-
blk.7.attn_output.biasF32[2560]
-
blk.7.attn_output.weightQ8_0[2560 2560]
-
blk.7.attn_k.biasF32[2560]
-
blk.7.attn_k.weightQ8_0[2560 2560]
-
blk.7.attn_q.biasF32[2560]
-
blk.7.attn_q.weightQ8_0[2560 2560]
-
blk.7.attn_v.biasF32[2560]
-
blk.7.attn_v.weightQ8_0[2560 2560]
-
blk.8.attn_norm.biasF32[2560]
-
blk.8.attn_norm.weightF32[2560]
-
blk.8.ffn_up.biasF32[10240]
-
blk.8.ffn_up.weightQ8_0[2560 10240]
-
blk.8.ffn_down.biasF32[2560]
-
blk.8.ffn_down.weightQ8_0[10240 2560]
-
blk.8.attn_output.biasF32[2560]
-
blk.8.attn_output.weightQ8_0[2560 2560]
-
blk.8.attn_k.biasF32[2560]
-
blk.8.attn_k.weightQ8_0[2560 2560]
-
blk.8.attn_q.biasF32[2560]
-
blk.8.attn_q.weightQ8_0[2560 2560]
-
blk.8.attn_v.biasF32[2560]
-
blk.8.attn_v.weightQ8_0[2560 2560]
-
blk.9.attn_norm.biasF32[2560]
-
blk.9.attn_norm.weightF32[2560]
-
blk.9.ffn_up.biasF32[10240]
-
blk.9.ffn_up.weightQ8_0[2560 10240]
-
blk.9.ffn_down.biasF32[2560]
-
blk.9.ffn_down.weightQ8_0[10240 2560]
-
blk.9.attn_output.biasF32[2560]
-
blk.9.attn_output.weightQ8_0[2560 2560]
-
blk.9.attn_k.biasF32[2560]
-
blk.9.attn_k.weightQ8_0[2560 2560]
-
blk.9.attn_q.biasF32[2560]
-
blk.9.attn_q.weightQ8_0[2560 2560]
-
blk.9.attn_v.biasF32[2560]
-
blk.9.attn_v.weightQ8_0[2560 2560]
-
blk.10.attn_norm.biasF32[2560]
-
blk.10.attn_norm.weightF32[2560]
-
blk.10.ffn_up.biasF32[10240]
-
blk.10.ffn_up.weightQ8_0[2560 10240]
-
blk.10.ffn_down.biasF32[2560]
-
blk.10.ffn_down.weightQ8_0[10240 2560]
-
blk.10.attn_output.biasF32[2560]
-
blk.10.attn_output.weightQ8_0[2560 2560]
-
blk.10.attn_k.biasF32[2560]
-
blk.10.attn_k.weightQ8_0[2560 2560]
-
blk.10.attn_q.biasF32[2560]
-
blk.10.attn_q.weightQ8_0[2560 2560]
-
blk.10.attn_v.biasF32[2560]
-
blk.10.attn_v.weightQ8_0[2560 2560]
-
blk.11.attn_norm.biasF32[2560]
-
blk.11.attn_norm.weightF32[2560]
-
blk.11.ffn_up.biasF32[10240]
-
blk.11.ffn_up.weightQ8_0[2560 10240]
-
blk.11.ffn_down.biasF32[2560]
-
blk.11.ffn_down.weightQ8_0[10240 2560]
-
blk.11.attn_output.biasF32[2560]
-
blk.11.attn_output.weightQ8_0[2560 2560]
-
blk.11.attn_k.biasF32[2560]
-
blk.11.attn_k.weightQ8_0[2560 2560]
-
blk.11.attn_q.biasF32[2560]
-
blk.11.attn_q.weightQ8_0[2560 2560]
-
blk.11.attn_v.biasF32[2560]
-
blk.11.attn_v.weightQ8_0[2560 2560]
-
blk.12.attn_norm.biasF32[2560]
-
blk.12.attn_norm.weightF32[2560]
-
blk.12.ffn_up.biasF32[10240]
-
blk.12.ffn_up.weightQ8_0[2560 10240]
-
blk.12.ffn_down.biasF32[2560]
-
blk.12.ffn_down.weightQ8_0[10240 2560]
-
blk.12.attn_output.biasF32[2560]
-
blk.12.attn_output.weightQ8_0[2560 2560]
-
blk.12.attn_k.biasF32[2560]
-
blk.12.attn_k.weightQ8_0[2560 2560]
-
blk.12.attn_q.biasF32[2560]
-
blk.12.attn_q.weightQ8_0[2560 2560]
-
blk.12.attn_v.biasF32[2560]
-
blk.12.attn_v.weightQ8_0[2560 2560]
-
blk.13.attn_norm.biasF32[2560]
-
blk.13.attn_norm.weightF32[2560]
-
blk.13.ffn_up.biasF32[10240]
-
blk.13.ffn_up.weightQ8_0[2560 10240]
-
blk.13.ffn_down.biasF32[2560]
-
blk.13.ffn_down.weightQ8_0[10240 2560]
-
blk.13.attn_output.biasF32[2560]
-
blk.13.attn_output.weightQ8_0[2560 2560]
-
blk.13.attn_k.biasF32[2560]
-
blk.13.attn_k.weightQ8_0[2560 2560]
-
blk.13.attn_q.biasF32[2560]
-
blk.13.attn_q.weightQ8_0[2560 2560]
-
blk.13.attn_v.biasF32[2560]
-
blk.13.attn_v.weightQ8_0[2560 2560]
-
blk.14.attn_norm.biasF32[2560]
-
blk.14.attn_norm.weightF32[2560]
-
blk.14.ffn_up.biasF32[10240]
-
blk.14.ffn_up.weightQ8_0[2560 10240]
-
blk.14.ffn_down.biasF32[2560]
-
blk.14.ffn_down.weightQ8_0[10240 2560]
-
blk.14.attn_output.biasF32[2560]
-
blk.14.attn_output.weightQ8_0[2560 2560]
-
blk.14.attn_k.biasF32[2560]
-
blk.14.attn_k.weightQ8_0[2560 2560]
-
blk.14.attn_q.biasF32[2560]
-
blk.14.attn_q.weightQ8_0[2560 2560]
-
blk.14.attn_v.biasF32[2560]
-
blk.14.attn_v.weightQ8_0[2560 2560]
-
blk.15.attn_norm.biasF32[2560]
-
blk.15.attn_norm.weightF32[2560]
-
blk.15.ffn_up.biasF32[10240]
-
blk.15.ffn_up.weightQ8_0[2560 10240]
-
blk.15.ffn_down.biasF32[2560]
-
blk.15.ffn_down.weightQ8_0[10240 2560]
-
blk.15.attn_output.biasF32[2560]
-
blk.15.attn_output.weightQ8_0[2560 2560]
-
blk.15.attn_k.biasF32[2560]
-
blk.15.attn_k.weightQ8_0[2560 2560]
-
blk.15.attn_q.biasF32[2560]
-
blk.15.attn_q.weightQ8_0[2560 2560]
-
blk.15.attn_v.biasF32[2560]
-
blk.15.attn_v.weightQ8_0[2560 2560]
-
blk.16.attn_norm.biasF32[2560]
-
blk.16.attn_norm.weightF32[2560]
-
blk.16.ffn_up.biasF32[10240]
-
blk.16.ffn_up.weightQ8_0[2560 10240]
-
blk.16.ffn_down.biasF32[2560]
-
blk.16.ffn_down.weightQ8_0[10240 2560]
-
blk.16.attn_output.biasF32[2560]
-
blk.16.attn_output.weightQ8_0[2560 2560]
-
blk.16.attn_k.biasF32[2560]
-
blk.16.attn_k.weightQ8_0[2560 2560]
-
blk.16.attn_q.biasF32[2560]
-
blk.16.attn_q.weightQ8_0[2560 2560]
-
blk.16.attn_v.biasF32[2560]
-
blk.16.attn_v.weightQ8_0[2560 2560]
-
blk.17.attn_norm.biasF32[2560]
-
blk.17.attn_norm.weightF32[2560]
-
blk.17.ffn_up.biasF32[10240]
-
blk.17.ffn_up.weightQ8_0[2560 10240]
-
blk.17.ffn_down.biasF32[2560]
-
blk.17.ffn_down.weightQ8_0[10240 2560]
-
blk.17.attn_output.biasF32[2560]
-
blk.17.attn_output.weightQ8_0[2560 2560]
-
blk.17.attn_k.biasF32[2560]
-
blk.17.attn_k.weightQ8_0[2560 2560]
-
blk.17.attn_q.biasF32[2560]
-
blk.17.attn_q.weightQ8_0[2560 2560]
-
blk.17.attn_v.biasF32[2560]
-
blk.17.attn_v.weightQ8_0[2560 2560]
-
blk.18.attn_norm.biasF32[2560]
-
blk.18.attn_norm.weightF32[2560]
-
blk.18.ffn_up.biasF32[10240]
-
blk.18.ffn_up.weightQ8_0[2560 10240]
-
blk.18.ffn_down.biasF32[2560]
-
blk.18.ffn_down.weightQ8_0[10240 2560]
-
blk.18.attn_output.biasF32[2560]
-
blk.18.attn_output.weightQ8_0[2560 2560]
-
blk.18.attn_k.biasF32[2560]
-
blk.18.attn_k.weightQ8_0[2560 2560]
-
blk.18.attn_q.biasF32[2560]
-
blk.18.attn_q.weightQ8_0[2560 2560]
-
blk.18.attn_v.biasF32[2560]
-
blk.18.attn_v.weightQ8_0[2560 2560]
-
blk.19.attn_norm.biasF32[2560]
-
blk.19.attn_norm.weightF32[2560]
-
blk.19.ffn_up.biasF32[10240]
-
blk.19.ffn_up.weightQ8_0[2560 10240]
-
blk.19.ffn_down.biasF32[2560]
-
blk.19.ffn_down.weightQ8_0[10240 2560]
-
blk.19.attn_output.biasF32[2560]
-
blk.19.attn_output.weightQ8_0[2560 2560]
-
blk.19.attn_k.biasF32[2560]
-
blk.19.attn_k.weightQ8_0[2560 2560]
-
blk.19.attn_q.biasF32[2560]
-
blk.19.attn_q.weightQ8_0[2560 2560]
-
blk.19.attn_v.biasF32[2560]
-
blk.19.attn_v.weightQ8_0[2560 2560]
-
blk.20.attn_norm.biasF32[2560]
-
blk.20.attn_norm.weightF32[2560]
-
blk.20.ffn_up.biasF32[10240]
-
blk.20.ffn_up.weightQ8_0[2560 10240]
-
blk.20.ffn_down.biasF32[2560]
-
blk.20.ffn_down.weightQ8_0[10240 2560]
-
blk.20.attn_output.biasF32[2560]
-
blk.20.attn_output.weightQ8_0[2560 2560]
-
blk.20.attn_k.biasF32[2560]
-
blk.20.attn_k.weightQ8_0[2560 2560]
-
blk.20.attn_q.biasF32[2560]
-
blk.20.attn_q.weightQ8_0[2560 2560]
-
blk.20.attn_v.biasF32[2560]
-
blk.20.attn_v.weightQ8_0[2560 2560]
-
blk.21.attn_norm.biasF32[2560]
-
blk.21.attn_norm.weightF32[2560]
-
blk.21.ffn_up.biasF32[10240]
-
blk.21.ffn_up.weightQ8_0[2560 10240]
-
blk.21.ffn_down.biasF32[2560]
-
blk.21.ffn_down.weightQ8_0[10240 2560]
-
blk.21.attn_output.biasF32[2560]
-
blk.21.attn_output.weightQ8_0[2560 2560]
-
blk.21.attn_k.biasF32[2560]
-
blk.21.attn_k.weightQ8_0[2560 2560]
-
blk.21.attn_q.biasF32[2560]
-
blk.21.attn_q.weightQ8_0[2560 2560]
-
blk.21.attn_v.biasF32[2560]
-
blk.21.attn_v.weightQ8_0[2560 2560]
-
blk.22.attn_norm.biasF32[2560]
-
blk.22.attn_norm.weightF32[2560]
-
blk.22.ffn_up.biasF32[10240]
-
blk.22.ffn_up.weightQ8_0[2560 10240]
-
blk.22.ffn_down.biasF32[2560]
-
blk.22.ffn_down.weightQ8_0[10240 2560]
-
blk.22.attn_output.biasF32[2560]
-
blk.22.attn_output.weightQ8_0[2560 2560]
-
blk.22.attn_k.biasF32[2560]
-
blk.22.attn_k.weightQ8_0[2560 2560]
-
blk.22.attn_q.biasF32[2560]
-
blk.22.attn_q.weightQ8_0[2560 2560]
-
blk.22.attn_v.biasF32[2560]
-
blk.22.attn_v.weightQ8_0[2560 2560]
-
blk.23.attn_norm.biasF32[2560]
-
blk.23.attn_norm.weightF32[2560]
-
blk.23.ffn_up.biasF32[10240]
-
blk.23.ffn_up.weightQ8_0[2560 10240]
-
blk.23.ffn_down.biasF32[2560]
-
blk.23.ffn_down.weightQ8_0[10240 2560]
-
blk.23.attn_output.biasF32[2560]
-
blk.23.attn_output.weightQ8_0[2560 2560]
-
blk.23.attn_k.biasF32[2560]
-
blk.23.attn_k.weightQ8_0[2560 2560]
-
blk.23.attn_q.biasF32[2560]
-
blk.23.attn_q.weightQ8_0[2560 2560]
-
blk.23.attn_v.biasF32[2560]
-
blk.23.attn_v.weightQ8_0[2560 2560]
-
blk.24.attn_norm.biasF32[2560]
-
blk.24.attn_norm.weightF32[2560]
-
blk.24.ffn_up.biasF32[10240]
-
blk.24.ffn_up.weightQ8_0[2560 10240]
-
blk.24.ffn_down.biasF32[2560]
-
blk.24.ffn_down.weightQ8_0[10240 2560]
-
blk.24.attn_output.biasF32[2560]
-
blk.24.attn_output.weightQ8_0[2560 2560]
-
blk.24.attn_k.biasF32[2560]
-
blk.24.attn_k.weightQ8_0[2560 2560]
-
blk.24.attn_q.biasF32[2560]
-
blk.24.attn_q.weightQ8_0[2560 2560]
-
blk.24.attn_v.biasF32[2560]
-
blk.24.attn_v.weightQ8_0[2560 2560]
-
blk.25.attn_norm.biasF32[2560]
-
blk.25.attn_norm.weightF32[2560]
-
blk.25.ffn_up.biasF32[10240]
-
blk.25.ffn_up.weightQ8_0[2560 10240]
-
blk.25.ffn_down.biasF32[2560]
-
blk.25.ffn_down.weightQ8_0[10240 2560]
-
blk.25.attn_output.biasF32[2560]
-
blk.25.attn_output.weightQ8_0[2560 2560]
-
blk.25.attn_k.biasF32[2560]
-
blk.25.attn_k.weightQ8_0[2560 2560]
-
blk.25.attn_q.biasF32[2560]
-
blk.25.attn_q.weightQ8_0[2560 2560]
-
blk.25.attn_v.biasF32[2560]
-
blk.25.attn_v.weightQ8_0[2560 2560]
-
blk.26.attn_norm.biasF32[2560]
-
blk.26.attn_norm.weightF32[2560]
-
blk.26.ffn_up.biasF32[10240]
-
blk.26.ffn_up.weightQ8_0[2560 10240]
-
blk.26.ffn_down.biasF32[2560]
-
blk.26.ffn_down.weightQ8_0[10240 2560]
-
blk.26.attn_output.biasF32[2560]
-
blk.26.attn_output.weightQ8_0[2560 2560]
-
blk.26.attn_k.biasF32[2560]
-
blk.26.attn_k.weightQ8_0[2560 2560]
-
blk.26.attn_q.biasF32[2560]
-
blk.26.attn_q.weightQ8_0[2560 2560]
-
blk.26.attn_v.biasF32[2560]
-
blk.26.attn_v.weightQ8_0[2560 2560]
-
blk.27.attn_norm.biasF32[2560]
-
blk.27.attn_norm.weightF32[2560]
-
blk.27.ffn_up.biasF32[10240]
-
blk.27.ffn_up.weightQ8_0[2560 10240]
-
blk.27.ffn_down.biasF32[2560]
-
blk.27.ffn_down.weightQ8_0[10240 2560]
-
blk.27.attn_output.biasF32[2560]
-
blk.27.attn_output.weightQ8_0[2560 2560]
-
blk.27.attn_k.biasF32[2560]
-
blk.27.attn_k.weightQ8_0[2560 2560]
-
blk.27.attn_q.biasF32[2560]
-
blk.27.attn_q.weightQ8_0[2560 2560]
-
blk.27.attn_v.biasF32[2560]
-
blk.27.attn_v.weightQ8_0[2560 2560]
-
blk.28.attn_norm.biasF32[2560]
-
blk.28.attn_norm.weightF32[2560]
-
blk.28.ffn_up.biasF32[10240]
-
blk.28.ffn_up.weightQ8_0[2560 10240]
-
blk.28.ffn_down.biasF32[2560]
-
blk.28.ffn_down.weightQ8_0[10240 2560]
-
blk.28.attn_output.biasF32[2560]
-
blk.28.attn_output.weightQ8_0[2560 2560]
-
blk.28.attn_k.biasF32[2560]
-
blk.28.attn_k.weightQ8_0[2560 2560]
-
blk.28.attn_q.biasF32[2560]
-
blk.28.attn_q.weightQ8_0[2560 2560]
-
blk.28.attn_v.biasF32[2560]
-
blk.28.attn_v.weightQ8_0[2560 2560]
-
blk.29.ffn_up.biasF32[10240]
-
blk.29.ffn_up.weightQ8_0[2560 10240]
-
blk.29.attn_output.biasF32[2560]
-
blk.29.attn_output.weightQ8_0[2560 2560]
-
blk.29.attn_k.biasF32[2560]
-
blk.29.attn_k.weightQ8_0[2560 2560]
-
blk.29.attn_q.biasF32[2560]
-
blk.29.attn_q.weightQ8_0[2560 2560]
-
blk.29.attn_v.biasF32[2560]
-
blk.29.attn_v.weightQ8_0[2560 2560]
-
blk.29.attn_norm.biasF32[2560]
-
blk.29.attn_norm.weightF32[2560]
-
blk.29.ffn_down.biasF32[2560]
-
blk.29.ffn_down.weightQ8_0[10240 2560]
-
blk.30.attn_norm.biasF32[2560]
-
blk.30.attn_norm.weightF32[2560]
-
blk.30.ffn_up.biasF32[10240]
-
blk.30.ffn_up.weightQ8_0[2560 10240]
-
blk.30.ffn_down.biasF32[2560]
-
blk.30.ffn_down.weightQ8_0[10240 2560]
-
blk.30.attn_output.biasF32[2560]
-
blk.30.attn_output.weightQ8_0[2560 2560]
-
blk.30.attn_k.biasF32[2560]
-
blk.30.attn_k.weightQ8_0[2560 2560]
-
blk.30.attn_q.biasF32[2560]
-
blk.30.attn_q.weightQ8_0[2560 2560]
-
blk.30.attn_v.biasF32[2560]
-
blk.30.attn_v.weightQ8_0[2560 2560]
-
blk.31.attn_norm.biasF32[2560]
-
blk.31.attn_norm.weightF32[2560]
-
blk.31.ffn_up.biasF32[10240]
-
blk.31.ffn_up.weightQ8_0[2560 10240]
-
blk.31.ffn_down.biasF32[2560]
-
blk.31.ffn_down.weightQ8_0[10240 2560]
-
blk.31.attn_output.biasF32[2560]
-
blk.31.attn_output.weightQ8_0[2560 2560]
-
blk.31.attn_k.biasF32[2560]
-
blk.31.attn_k.weightQ8_0[2560 2560]
-
blk.31.attn_q.biasF32[2560]
-
blk.31.attn_q.weightQ8_0[2560 2560]
-
blk.31.attn_v.biasF32[2560]
-
blk.31.attn_v.weightQ8_0[2560 2560]
-
output.biasF32[58944]
-
output.weightQ8_0[2560 58944]
-
output_norm.biasF32[2560]
-
output_norm.weightF32[2560]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31