latest
65GB
32B
Updated 2 days ago
7bb9d39c9d77 · 65GB
-
general.architectureqwen2
-
general.file_typeF16
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count64
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length27392
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightF16[5120 152064]
-
blk.0.ffn_gate.weightF16[5120 27392]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightF16[5120 1024]
-
blk.0.attn_output.weightF16[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightF16[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightF16[5120 1024]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightF16[27392 5120]
-
blk.0.ffn_up.weightF16[5120 27392]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightF16[27392 5120]
-
blk.1.ffn_gate.weightF16[5120 27392]
-
blk.1.ffn_up.weightF16[5120 27392]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightF16[5120 1024]
-
blk.1.attn_output.weightF16[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightF16[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightF16[5120 1024]
-
blk.2.ffn_gate.weightF16[5120 27392]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightF16[5120 1024]
-
blk.2.attn_output.weightF16[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightF16[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightF16[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightF16[27392 5120]
-
blk.2.ffn_up.weightF16[5120 27392]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightF16[27392 5120]
-
blk.3.ffn_gate.weightF16[5120 27392]
-
blk.3.ffn_up.weightF16[5120 27392]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightF16[5120 1024]
-
blk.3.attn_output.weightF16[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightF16[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightF16[5120 1024]
-
blk.4.ffn_gate.weightF16[5120 27392]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightF16[5120 1024]
-
blk.4.attn_output.weightF16[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightF16[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightF16[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightF16[27392 5120]
-
blk.4.ffn_up.weightF16[5120 27392]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightF16[27392 5120]
-
blk.5.ffn_gate.weightF16[5120 27392]
-
blk.5.ffn_up.weightF16[5120 27392]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightF16[5120 1024]
-
blk.5.attn_output.weightF16[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightF16[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightF16[5120 1024]
-
blk.6.ffn_gate.weightF16[5120 27392]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightF16[5120 1024]
-
blk.6.attn_output.weightF16[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightF16[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightF16[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightF16[27392 5120]
-
blk.6.ffn_up.weightF16[5120 27392]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightF16[27392 5120]
-
blk.7.ffn_gate.weightF16[5120 27392]
-
blk.7.ffn_up.weightF16[5120 27392]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightF16[5120 1024]
-
blk.7.attn_output.weightF16[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightF16[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightF16[5120 1024]
-
blk.8.ffn_gate.weightF16[5120 27392]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightF16[5120 1024]
-
blk.8.attn_output.weightF16[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightF16[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightF16[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightF16[27392 5120]
-
blk.8.ffn_up.weightF16[5120 27392]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightF16[27392 5120]
-
blk.9.ffn_gate.weightF16[5120 27392]
-
blk.9.ffn_up.weightF16[5120 27392]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightF16[5120 1024]
-
blk.9.attn_output.weightF16[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightF16[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightF16[5120 1024]
-
blk.10.ffn_gate.weightF16[5120 27392]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightF16[5120 1024]
-
blk.10.attn_output.weightF16[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightF16[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightF16[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightF16[27392 5120]
-
blk.10.ffn_up.weightF16[5120 27392]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightF16[27392 5120]
-
blk.11.ffn_gate.weightF16[5120 27392]
-
blk.11.ffn_up.weightF16[5120 27392]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightF16[5120 1024]
-
blk.11.attn_output.weightF16[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightF16[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightF16[5120 1024]
-
blk.12.ffn_gate.weightF16[5120 27392]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightF16[5120 1024]
-
blk.12.attn_output.weightF16[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightF16[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightF16[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightF16[27392 5120]
-
blk.12.ffn_up.weightF16[5120 27392]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightF16[27392 5120]
-
blk.13.ffn_gate.weightF16[5120 27392]
-
blk.13.ffn_up.weightF16[5120 27392]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightF16[5120 1024]
-
blk.13.attn_output.weightF16[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightF16[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightF16[5120 1024]
-
blk.14.ffn_gate.weightF16[5120 27392]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightF16[5120 1024]
-
blk.14.attn_output.weightF16[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightF16[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightF16[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightF16[27392 5120]
-
blk.14.ffn_up.weightF16[5120 27392]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightF16[27392 5120]
-
blk.15.ffn_gate.weightF16[5120 27392]
-
blk.15.ffn_up.weightF16[5120 27392]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightF16[5120 1024]
-
blk.15.attn_output.weightF16[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightF16[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightF16[5120 1024]
-
blk.16.ffn_gate.weightF16[5120 27392]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightF16[5120 1024]
-
blk.16.attn_output.weightF16[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightF16[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightF16[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightF16[27392 5120]
-
blk.16.ffn_up.weightF16[5120 27392]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightF16[27392 5120]
-
blk.17.ffn_gate.weightF16[5120 27392]
-
blk.17.ffn_up.weightF16[5120 27392]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightF16[5120 1024]
-
blk.17.attn_output.weightF16[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightF16[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightF16[5120 1024]
-
blk.18.ffn_gate.weightF16[5120 27392]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightF16[5120 1024]
-
blk.18.attn_output.weightF16[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightF16[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightF16[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightF16[27392 5120]
-
blk.18.ffn_up.weightF16[5120 27392]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightF16[27392 5120]
-
blk.19.ffn_gate.weightF16[5120 27392]
-
blk.19.ffn_up.weightF16[5120 27392]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightF16[5120 1024]
-
blk.19.attn_output.weightF16[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightF16[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightF16[5120 1024]
-
blk.20.ffn_gate.weightF16[5120 27392]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightF16[5120 1024]
-
blk.20.attn_output.weightF16[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightF16[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightF16[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightF16[27392 5120]
-
blk.20.ffn_up.weightF16[5120 27392]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightF16[27392 5120]
-
blk.21.ffn_gate.weightF16[5120 27392]
-
blk.21.ffn_up.weightF16[5120 27392]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightF16[5120 1024]
-
blk.21.attn_output.weightF16[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightF16[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightF16[5120 1024]
-
blk.22.ffn_gate.weightF16[5120 27392]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightF16[5120 1024]
-
blk.22.attn_output.weightF16[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightF16[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightF16[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightF16[27392 5120]
-
blk.22.ffn_up.weightF16[5120 27392]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightF16[27392 5120]
-
blk.23.ffn_gate.weightF16[5120 27392]
-
blk.23.ffn_up.weightF16[5120 27392]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightF16[5120 1024]
-
blk.23.attn_output.weightF16[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightF16[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightF16[5120 1024]
-
blk.24.ffn_gate.weightF16[5120 27392]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightF16[5120 1024]
-
blk.24.attn_output.weightF16[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightF16[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightF16[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightF16[27392 5120]
-
blk.24.ffn_up.weightF16[5120 27392]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightF16[27392 5120]
-
blk.25.ffn_gate.weightF16[5120 27392]
-
blk.25.ffn_up.weightF16[5120 27392]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightF16[5120 1024]
-
blk.25.attn_output.weightF16[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightF16[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightF16[5120 1024]
-
blk.26.ffn_gate.weightF16[5120 27392]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightF16[5120 1024]
-
blk.26.attn_output.weightF16[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightF16[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightF16[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightF16[27392 5120]
-
blk.26.ffn_up.weightF16[5120 27392]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightF16[27392 5120]
-
blk.27.ffn_gate.weightF16[5120 27392]
-
blk.27.ffn_up.weightF16[5120 27392]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightF16[5120 1024]
-
blk.27.attn_output.weightF16[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightF16[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightF16[5120 1024]
-
blk.28.ffn_gate.weightF16[5120 27392]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightF16[5120 1024]
-
blk.28.attn_output.weightF16[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightF16[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightF16[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightF16[27392 5120]
-
blk.28.ffn_up.weightF16[5120 27392]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightF16[27392 5120]
-
blk.29.ffn_gate.weightF16[5120 27392]
-
blk.29.ffn_up.weightF16[5120 27392]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightF16[5120 1024]
-
blk.29.attn_output.weightF16[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightF16[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightF16[5120 1024]
-
blk.30.ffn_gate.weightF16[5120 27392]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightF16[5120 1024]
-
blk.30.attn_output.weightF16[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightF16[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightF16[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightF16[27392 5120]
-
blk.30.ffn_up.weightF16[5120 27392]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightF16[27392 5120]
-
blk.31.ffn_gate.weightF16[5120 27392]
-
blk.31.ffn_up.weightF16[5120 27392]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightF16[5120 1024]
-
blk.31.attn_output.weightF16[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightF16[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightF16[5120 1024]
-
blk.32.ffn_gate.weightF16[5120 27392]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightF16[5120 1024]
-
blk.32.attn_output.weightF16[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightF16[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightF16[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightF16[27392 5120]
-
blk.32.ffn_up.weightF16[5120 27392]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightF16[27392 5120]
-
blk.33.ffn_gate.weightF16[5120 27392]
-
blk.33.ffn_up.weightF16[5120 27392]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightF16[5120 1024]
-
blk.33.attn_output.weightF16[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightF16[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightF16[5120 1024]
-
blk.34.ffn_gate.weightF16[5120 27392]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightF16[5120 1024]
-
blk.34.attn_output.weightF16[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightF16[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightF16[5120 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightF16[27392 5120]
-
blk.34.ffn_up.weightF16[5120 27392]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightF16[27392 5120]
-
blk.35.ffn_gate.weightF16[5120 27392]
-
blk.35.ffn_up.weightF16[5120 27392]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightF16[5120 1024]
-
blk.35.attn_output.weightF16[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightF16[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightF16[5120 1024]
-
blk.36.ffn_gate.weightF16[5120 27392]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightF16[5120 1024]
-
blk.36.attn_output.weightF16[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightF16[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightF16[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightF16[27392 5120]
-
blk.36.ffn_up.weightF16[5120 27392]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightF16[27392 5120]
-
blk.37.ffn_gate.weightF16[5120 27392]
-
blk.37.ffn_up.weightF16[5120 27392]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightF16[5120 1024]
-
blk.37.attn_output.weightF16[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightF16[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightF16[5120 1024]
-
blk.38.ffn_gate.weightF16[5120 27392]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightF16[5120 1024]
-
blk.38.attn_output.weightF16[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightF16[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightF16[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightF16[27392 5120]
-
blk.38.ffn_up.weightF16[5120 27392]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightF16[27392 5120]
-
blk.39.ffn_gate.weightF16[5120 27392]
-
blk.39.ffn_up.weightF16[5120 27392]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightF16[5120 1024]
-
blk.39.attn_output.weightF16[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightF16[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightF16[5120 1024]
-
blk.40.ffn_gate.weightF16[5120 27392]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightF16[5120 1024]
-
blk.40.attn_output.weightF16[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightF16[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightF16[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightF16[27392 5120]
-
blk.40.ffn_up.weightF16[5120 27392]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightF16[27392 5120]
-
blk.41.ffn_gate.weightF16[5120 27392]
-
blk.41.ffn_up.weightF16[5120 27392]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightF16[5120 1024]
-
blk.41.attn_output.weightF16[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightF16[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightF16[5120 1024]
-
blk.42.ffn_gate.weightF16[5120 27392]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightF16[5120 1024]
-
blk.42.attn_output.weightF16[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightF16[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightF16[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightF16[27392 5120]
-
blk.42.ffn_up.weightF16[5120 27392]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightF16[27392 5120]
-
blk.43.ffn_gate.weightF16[5120 27392]
-
blk.43.ffn_up.weightF16[5120 27392]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightF16[5120 1024]
-
blk.43.attn_output.weightF16[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightF16[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightF16[5120 1024]
-
blk.44.ffn_gate.weightF16[5120 27392]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightF16[5120 1024]
-
blk.44.attn_output.weightF16[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightF16[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightF16[5120 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightF16[27392 5120]
-
blk.44.ffn_up.weightF16[5120 27392]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightF16[27392 5120]
-
blk.45.ffn_gate.weightF16[5120 27392]
-
blk.45.ffn_up.weightF16[5120 27392]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightF16[5120 1024]
-
blk.45.attn_output.weightF16[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightF16[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightF16[5120 1024]
-
blk.46.ffn_gate.weightF16[5120 27392]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightF16[5120 1024]
-
blk.46.attn_output.weightF16[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightF16[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightF16[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightF16[27392 5120]
-
blk.46.ffn_up.weightF16[5120 27392]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightF16[27392 5120]
-
blk.47.ffn_gate.weightF16[5120 27392]
-
blk.47.ffn_up.weightF16[5120 27392]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightF16[5120 1024]
-
blk.47.attn_output.weightF16[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightF16[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightF16[5120 1024]
-
blk.48.ffn_gate.weightF16[5120 27392]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightF16[5120 1024]
-
blk.48.attn_output.weightF16[5120 5120]
-
blk.48.attn_q.biasF32[5120]
-
blk.48.attn_q.weightF16[5120 5120]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightF16[5120 1024]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.ffn_down.weightF16[27392 5120]
-
blk.48.ffn_up.weightF16[5120 27392]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.ffn_down.weightF16[27392 5120]
-
blk.49.ffn_gate.weightF16[5120 27392]
-
blk.49.ffn_up.weightF16[5120 27392]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightF16[5120 1024]
-
blk.49.attn_output.weightF16[5120 5120]
-
blk.49.attn_q.biasF32[5120]
-
blk.49.attn_q.weightF16[5120 5120]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightF16[5120 1024]
-
blk.50.ffn_gate.weightF16[5120 27392]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightF16[5120 1024]
-
blk.50.attn_output.weightF16[5120 5120]
-
blk.50.attn_q.biasF32[5120]
-
blk.50.attn_q.weightF16[5120 5120]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightF16[5120 1024]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.ffn_down.weightF16[27392 5120]
-
blk.50.ffn_up.weightF16[5120 27392]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.ffn_down.weightF16[27392 5120]
-
blk.51.ffn_gate.weightF16[5120 27392]
-
blk.51.ffn_up.weightF16[5120 27392]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightF16[5120 1024]
-
blk.51.attn_output.weightF16[5120 5120]
-
blk.51.attn_q.biasF32[5120]
-
blk.51.attn_q.weightF16[5120 5120]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightF16[5120 1024]
-
blk.52.ffn_gate.weightF16[5120 27392]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightF16[5120 1024]
-
blk.52.attn_output.weightF16[5120 5120]
-
blk.52.attn_q.biasF32[5120]
-
blk.52.attn_q.weightF16[5120 5120]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightF16[5120 1024]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.ffn_down.weightF16[27392 5120]
-
blk.52.ffn_up.weightF16[5120 27392]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.ffn_down.weightF16[27392 5120]
-
blk.53.ffn_gate.weightF16[5120 27392]
-
blk.53.ffn_up.weightF16[5120 27392]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightF16[5120 1024]
-
blk.53.attn_output.weightF16[5120 5120]
-
blk.53.attn_q.biasF32[5120]
-
blk.53.attn_q.weightF16[5120 5120]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightF16[5120 1024]
-
blk.54.ffn_gate.weightF16[5120 27392]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightF16[5120 1024]
-
blk.54.attn_output.weightF16[5120 5120]
-
blk.54.attn_q.biasF32[5120]
-
blk.54.attn_q.weightF16[5120 5120]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightF16[5120 1024]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.ffn_down.weightF16[27392 5120]
-
blk.54.ffn_up.weightF16[5120 27392]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.ffn_down.weightF16[27392 5120]
-
blk.55.ffn_gate.weightF16[5120 27392]
-
blk.55.ffn_up.weightF16[5120 27392]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightF16[5120 1024]
-
blk.55.attn_output.weightF16[5120 5120]
-
blk.55.attn_q.biasF32[5120]
-
blk.55.attn_q.weightF16[5120 5120]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightF16[5120 1024]
-
blk.56.ffn_gate.weightF16[5120 27392]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightF16[5120 1024]
-
blk.56.attn_output.weightF16[5120 5120]
-
blk.56.attn_q.biasF32[5120]
-
blk.56.attn_q.weightF16[5120 5120]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightF16[5120 1024]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.ffn_down.weightF16[27392 5120]
-
blk.56.ffn_up.weightF16[5120 27392]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.ffn_down.weightF16[27392 5120]
-
blk.57.ffn_gate.weightF16[5120 27392]
-
blk.57.ffn_up.weightF16[5120 27392]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightF16[5120 1024]
-
blk.57.attn_output.weightF16[5120 5120]
-
blk.57.attn_q.biasF32[5120]
-
blk.57.attn_q.weightF16[5120 5120]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightF16[5120 1024]
-
blk.58.ffn_gate.weightF16[5120 27392]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightF16[5120 1024]
-
blk.58.attn_output.weightF16[5120 5120]
-
blk.58.attn_q.biasF32[5120]
-
blk.58.attn_q.weightF16[5120 5120]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightF16[5120 1024]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.ffn_down.weightF16[27392 5120]
-
blk.58.ffn_up.weightF16[5120 27392]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.ffn_down.weightF16[27392 5120]
-
blk.59.ffn_gate.weightF16[5120 27392]
-
blk.59.ffn_up.weightF16[5120 27392]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightF16[5120 1024]
-
blk.59.attn_output.weightF16[5120 5120]
-
blk.59.attn_q.biasF32[5120]
-
blk.59.attn_q.weightF16[5120 5120]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightF16[5120 1024]
-
blk.60.ffn_gate.weightF16[5120 27392]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightF16[5120 1024]
-
blk.60.attn_output.weightF16[5120 5120]
-
blk.60.attn_q.biasF32[5120]
-
blk.60.attn_q.weightF16[5120 5120]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightF16[5120 1024]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.ffn_down.weightF16[27392 5120]
-
blk.60.ffn_up.weightF16[5120 27392]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.ffn_down.weightF16[27392 5120]
-
blk.61.ffn_gate.weightF16[5120 27392]
-
blk.61.ffn_up.weightF16[5120 27392]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightF16[5120 1024]
-
blk.61.attn_output.weightF16[5120 5120]
-
blk.61.attn_q.biasF32[5120]
-
blk.61.attn_q.weightF16[5120 5120]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightF16[5120 1024]
-
blk.62.ffn_gate.weightF16[5120 27392]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightF16[5120 1024]
-
blk.62.attn_output.weightF16[5120 5120]
-
blk.62.attn_q.biasF32[5120]
-
blk.62.attn_q.weightF16[5120 5120]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightF16[5120 1024]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.ffn_down.weightF16[27392 5120]
-
blk.62.ffn_up.weightF16[5120 27392]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.ffn_down.weightF16[27392 5120]
-
blk.63.ffn_gate.weightF16[5120 27392]
-
blk.63.ffn_up.weightF16[5120 27392]
-
blk.63.ffn_norm.weightF32[5120]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightF16[5120 1024]
-
blk.63.attn_output.weightF16[5120 5120]
-
blk.63.attn_q.biasF32[5120]
-
blk.63.attn_q.weightF16[5120 5120]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightF16[5120 1024]
-
output_norm.weightF32[5120]
-
output.weightF16[5120 152064]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63