latest
65GB
32B
9 Pulls Updated 3 months ago
4d33c9ae11f4 · 65GB
-
general.architectureqwen2
-
general.file_typeF16
-
qwen2.attention.head_count40
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count64
-
qwen2.context_length32768
-
qwen2.embedding_length5120
-
qwen2.feed_forward_length27392
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightF16[5120 152064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightF16[27392 5120]
-
blk.0.ffn_gate.weightF16[5120 27392]
-
blk.0.ffn_up.weightF16[5120 27392]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightF16[5120 1024]
-
blk.0.attn_output.weightF16[5120 5120]
-
blk.0.attn_q.biasF32[5120]
-
blk.0.attn_q.weightF16[5120 5120]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightF16[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightF16[27392 5120]
-
blk.1.ffn_gate.weightF16[5120 27392]
-
blk.1.ffn_up.weightF16[5120 27392]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightF16[5120 1024]
-
blk.1.attn_output.weightF16[5120 5120]
-
blk.1.attn_q.biasF32[5120]
-
blk.1.attn_q.weightF16[5120 5120]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightF16[5120 1024]
-
blk.2.ffn_gate.weightF16[5120 27392]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightF16[5120 1024]
-
blk.2.attn_output.weightF16[5120 5120]
-
blk.2.attn_q.biasF32[5120]
-
blk.2.attn_q.weightF16[5120 5120]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightF16[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightF16[27392 5120]
-
blk.2.ffn_up.weightF16[5120 27392]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightF16[27392 5120]
-
blk.3.ffn_gate.weightF16[5120 27392]
-
blk.3.ffn_up.weightF16[5120 27392]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightF16[5120 1024]
-
blk.3.attn_output.weightF16[5120 5120]
-
blk.3.attn_q.biasF32[5120]
-
blk.3.attn_q.weightF16[5120 5120]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightF16[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightF16[27392 5120]
-
blk.4.ffn_gate.weightF16[5120 27392]
-
blk.4.ffn_up.weightF16[5120 27392]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightF16[5120 1024]
-
blk.4.attn_output.weightF16[5120 5120]
-
blk.4.attn_q.biasF32[5120]
-
blk.4.attn_q.weightF16[5120 5120]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightF16[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightF16[27392 5120]
-
blk.5.ffn_gate.weightF16[5120 27392]
-
blk.5.ffn_up.weightF16[5120 27392]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightF16[5120 1024]
-
blk.5.attn_output.weightF16[5120 5120]
-
blk.5.attn_q.biasF32[5120]
-
blk.5.attn_q.weightF16[5120 5120]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightF16[5120 1024]
-
blk.6.ffn_gate.weightF16[5120 27392]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightF16[5120 1024]
-
blk.6.attn_output.weightF16[5120 5120]
-
blk.6.attn_q.biasF32[5120]
-
blk.6.attn_q.weightF16[5120 5120]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightF16[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightF16[27392 5120]
-
blk.6.ffn_up.weightF16[5120 27392]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightF16[27392 5120]
-
blk.7.ffn_gate.weightF16[5120 27392]
-
blk.7.ffn_up.weightF16[5120 27392]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightF16[5120 1024]
-
blk.7.attn_output.weightF16[5120 5120]
-
blk.7.attn_q.biasF32[5120]
-
blk.7.attn_q.weightF16[5120 5120]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightF16[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightF16[27392 5120]
-
blk.8.ffn_gate.weightF16[5120 27392]
-
blk.8.ffn_up.weightF16[5120 27392]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightF16[5120 1024]
-
blk.8.attn_output.weightF16[5120 5120]
-
blk.8.attn_q.biasF32[5120]
-
blk.8.attn_q.weightF16[5120 5120]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightF16[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightF16[27392 5120]
-
blk.9.ffn_gate.weightF16[5120 27392]
-
blk.9.ffn_up.weightF16[5120 27392]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightF16[5120 1024]
-
blk.9.attn_output.weightF16[5120 5120]
-
blk.9.attn_q.biasF32[5120]
-
blk.9.attn_q.weightF16[5120 5120]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightF16[5120 1024]
-
blk.10.ffn_gate.weightF16[5120 27392]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightF16[5120 1024]
-
blk.10.attn_output.weightF16[5120 5120]
-
blk.10.attn_q.biasF32[5120]
-
blk.10.attn_q.weightF16[5120 5120]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightF16[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightF16[27392 5120]
-
blk.10.ffn_up.weightF16[5120 27392]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightF16[27392 5120]
-
blk.11.ffn_gate.weightF16[5120 27392]
-
blk.11.ffn_up.weightF16[5120 27392]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightF16[5120 1024]
-
blk.11.attn_output.weightF16[5120 5120]
-
blk.11.attn_q.biasF32[5120]
-
blk.11.attn_q.weightF16[5120 5120]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightF16[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightF16[27392 5120]
-
blk.12.ffn_gate.weightF16[5120 27392]
-
blk.12.ffn_up.weightF16[5120 27392]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightF16[5120 1024]
-
blk.12.attn_output.weightF16[5120 5120]
-
blk.12.attn_q.biasF32[5120]
-
blk.12.attn_q.weightF16[5120 5120]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightF16[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightF16[27392 5120]
-
blk.13.ffn_gate.weightF16[5120 27392]
-
blk.13.ffn_up.weightF16[5120 27392]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightF16[5120 1024]
-
blk.13.attn_output.weightF16[5120 5120]
-
blk.13.attn_q.biasF32[5120]
-
blk.13.attn_q.weightF16[5120 5120]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightF16[5120 1024]
-
blk.14.ffn_gate.weightF16[5120 27392]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightF16[5120 1024]
-
blk.14.attn_output.weightF16[5120 5120]
-
blk.14.attn_q.biasF32[5120]
-
blk.14.attn_q.weightF16[5120 5120]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightF16[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightF16[27392 5120]
-
blk.14.ffn_up.weightF16[5120 27392]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightF16[27392 5120]
-
blk.15.ffn_gate.weightF16[5120 27392]
-
blk.15.ffn_up.weightF16[5120 27392]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightF16[5120 1024]
-
blk.15.attn_output.weightF16[5120 5120]
-
blk.15.attn_q.biasF32[5120]
-
blk.15.attn_q.weightF16[5120 5120]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightF16[5120 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightF16[27392 5120]
-
blk.16.ffn_gate.weightF16[5120 27392]
-
blk.16.ffn_up.weightF16[5120 27392]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightF16[5120 1024]
-
blk.16.attn_output.weightF16[5120 5120]
-
blk.16.attn_q.biasF32[5120]
-
blk.16.attn_q.weightF16[5120 5120]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightF16[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightF16[27392 5120]
-
blk.17.ffn_gate.weightF16[5120 27392]
-
blk.17.ffn_up.weightF16[5120 27392]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightF16[5120 1024]
-
blk.17.attn_output.weightF16[5120 5120]
-
blk.17.attn_q.biasF32[5120]
-
blk.17.attn_q.weightF16[5120 5120]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightF16[5120 1024]
-
blk.18.ffn_gate.weightF16[5120 27392]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightF16[5120 1024]
-
blk.18.attn_output.weightF16[5120 5120]
-
blk.18.attn_q.biasF32[5120]
-
blk.18.attn_q.weightF16[5120 5120]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightF16[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightF16[27392 5120]
-
blk.18.ffn_up.weightF16[5120 27392]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightF16[27392 5120]
-
blk.19.ffn_gate.weightF16[5120 27392]
-
blk.19.ffn_up.weightF16[5120 27392]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightF16[5120 1024]
-
blk.19.attn_output.weightF16[5120 5120]
-
blk.19.attn_q.biasF32[5120]
-
blk.19.attn_q.weightF16[5120 5120]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightF16[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightF16[27392 5120]
-
blk.20.ffn_gate.weightF16[5120 27392]
-
blk.20.ffn_up.weightF16[5120 27392]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightF16[5120 1024]
-
blk.20.attn_output.weightF16[5120 5120]
-
blk.20.attn_q.biasF32[5120]
-
blk.20.attn_q.weightF16[5120 5120]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightF16[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightF16[27392 5120]
-
blk.21.ffn_gate.weightF16[5120 27392]
-
blk.21.ffn_up.weightF16[5120 27392]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightF16[5120 1024]
-
blk.21.attn_output.weightF16[5120 5120]
-
blk.21.attn_q.biasF32[5120]
-
blk.21.attn_q.weightF16[5120 5120]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightF16[5120 1024]
-
blk.22.ffn_gate.weightF16[5120 27392]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightF16[5120 1024]
-
blk.22.attn_output.weightF16[5120 5120]
-
blk.22.attn_q.biasF32[5120]
-
blk.22.attn_q.weightF16[5120 5120]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightF16[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightF16[27392 5120]
-
blk.22.ffn_up.weightF16[5120 27392]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightF16[27392 5120]
-
blk.23.ffn_gate.weightF16[5120 27392]
-
blk.23.ffn_up.weightF16[5120 27392]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightF16[5120 1024]
-
blk.23.attn_output.weightF16[5120 5120]
-
blk.23.attn_q.biasF32[5120]
-
blk.23.attn_q.weightF16[5120 5120]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightF16[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightF16[27392 5120]
-
blk.24.ffn_gate.weightF16[5120 27392]
-
blk.24.ffn_up.weightF16[5120 27392]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightF16[5120 1024]
-
blk.24.attn_output.weightF16[5120 5120]
-
blk.24.attn_q.biasF32[5120]
-
blk.24.attn_q.weightF16[5120 5120]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightF16[5120 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightF16[27392 5120]
-
blk.25.ffn_gate.weightF16[5120 27392]
-
blk.25.ffn_up.weightF16[5120 27392]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightF16[5120 1024]
-
blk.25.attn_output.weightF16[5120 5120]
-
blk.25.attn_q.biasF32[5120]
-
blk.25.attn_q.weightF16[5120 5120]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightF16[5120 1024]
-
blk.26.ffn_gate.weightF16[5120 27392]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightF16[5120 1024]
-
blk.26.attn_output.weightF16[5120 5120]
-
blk.26.attn_q.biasF32[5120]
-
blk.26.attn_q.weightF16[5120 5120]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightF16[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightF16[27392 5120]
-
blk.26.ffn_up.weightF16[5120 27392]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightF16[27392 5120]
-
blk.27.ffn_gate.weightF16[5120 27392]
-
blk.27.ffn_up.weightF16[5120 27392]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightF16[5120 1024]
-
blk.27.attn_output.weightF16[5120 5120]
-
blk.27.attn_q.biasF32[5120]
-
blk.27.attn_q.weightF16[5120 5120]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightF16[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightF16[27392 5120]
-
blk.28.ffn_gate.weightF16[5120 27392]
-
blk.28.ffn_up.weightF16[5120 27392]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightF16[5120 1024]
-
blk.28.attn_output.weightF16[5120 5120]
-
blk.28.attn_q.biasF32[5120]
-
blk.28.attn_q.weightF16[5120 5120]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightF16[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightF16[27392 5120]
-
blk.29.ffn_gate.weightF16[5120 27392]
-
blk.29.ffn_up.weightF16[5120 27392]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightF16[5120 1024]
-
blk.29.attn_output.weightF16[5120 5120]
-
blk.29.attn_q.biasF32[5120]
-
blk.29.attn_q.weightF16[5120 5120]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightF16[5120 1024]
-
blk.30.ffn_gate.weightF16[5120 27392]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightF16[5120 1024]
-
blk.30.attn_output.weightF16[5120 5120]
-
blk.30.attn_q.biasF32[5120]
-
blk.30.attn_q.weightF16[5120 5120]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightF16[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightF16[27392 5120]
-
blk.30.ffn_up.weightF16[5120 27392]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightF16[27392 5120]
-
blk.31.ffn_gate.weightF16[5120 27392]
-
blk.31.ffn_up.weightF16[5120 27392]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightF16[5120 1024]
-
blk.31.attn_output.weightF16[5120 5120]
-
blk.31.attn_q.biasF32[5120]
-
blk.31.attn_q.weightF16[5120 5120]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightF16[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightF16[27392 5120]
-
blk.32.ffn_gate.weightF16[5120 27392]
-
blk.32.ffn_up.weightF16[5120 27392]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightF16[5120 1024]
-
blk.32.attn_output.weightF16[5120 5120]
-
blk.32.attn_q.biasF32[5120]
-
blk.32.attn_q.weightF16[5120 5120]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightF16[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightF16[27392 5120]
-
blk.33.ffn_gate.weightF16[5120 27392]
-
blk.33.ffn_up.weightF16[5120 27392]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightF16[5120 1024]
-
blk.33.attn_output.weightF16[5120 5120]
-
blk.33.attn_q.biasF32[5120]
-
blk.33.attn_q.weightF16[5120 5120]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightF16[5120 1024]
-
blk.34.ffn_gate.weightF16[5120 27392]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightF16[5120 1024]
-
blk.34.attn_output.weightF16[5120 5120]
-
blk.34.attn_q.biasF32[5120]
-
blk.34.attn_q.weightF16[5120 5120]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightF16[5120 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightF16[27392 5120]
-
blk.34.ffn_up.weightF16[5120 27392]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightF16[27392 5120]
-
blk.35.ffn_gate.weightF16[5120 27392]
-
blk.35.ffn_up.weightF16[5120 27392]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightF16[5120 1024]
-
blk.35.attn_output.weightF16[5120 5120]
-
blk.35.attn_q.biasF32[5120]
-
blk.35.attn_q.weightF16[5120 5120]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightF16[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightF16[27392 5120]
-
blk.36.ffn_gate.weightF16[5120 27392]
-
blk.36.ffn_up.weightF16[5120 27392]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightF16[5120 1024]
-
blk.36.attn_output.weightF16[5120 5120]
-
blk.36.attn_q.biasF32[5120]
-
blk.36.attn_q.weightF16[5120 5120]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightF16[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightF16[27392 5120]
-
blk.37.ffn_gate.weightF16[5120 27392]
-
blk.37.ffn_up.weightF16[5120 27392]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightF16[5120 1024]
-
blk.37.attn_output.weightF16[5120 5120]
-
blk.37.attn_q.biasF32[5120]
-
blk.37.attn_q.weightF16[5120 5120]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightF16[5120 1024]
-
blk.38.ffn_gate.weightF16[5120 27392]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightF16[5120 1024]
-
blk.38.attn_output.weightF16[5120 5120]
-
blk.38.attn_q.biasF32[5120]
-
blk.38.attn_q.weightF16[5120 5120]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightF16[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightF16[27392 5120]
-
blk.38.ffn_up.weightF16[5120 27392]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightF16[27392 5120]
-
blk.39.ffn_gate.weightF16[5120 27392]
-
blk.39.ffn_up.weightF16[5120 27392]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightF16[5120 1024]
-
blk.39.attn_output.weightF16[5120 5120]
-
blk.39.attn_q.biasF32[5120]
-
blk.39.attn_q.weightF16[5120 5120]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightF16[5120 1024]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightF16[27392 5120]
-
blk.40.ffn_gate.weightF16[5120 27392]
-
blk.40.ffn_up.weightF16[5120 27392]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightF16[5120 1024]
-
blk.40.attn_output.weightF16[5120 5120]
-
blk.40.attn_q.biasF32[5120]
-
blk.40.attn_q.weightF16[5120 5120]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightF16[5120 1024]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightF16[27392 5120]
-
blk.41.ffn_gate.weightF16[5120 27392]
-
blk.41.ffn_up.weightF16[5120 27392]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightF16[5120 1024]
-
blk.41.attn_output.weightF16[5120 5120]
-
blk.41.attn_q.biasF32[5120]
-
blk.41.attn_q.weightF16[5120 5120]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightF16[5120 1024]
-
blk.42.ffn_gate.weightF16[5120 27392]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightF16[5120 1024]
-
blk.42.attn_output.weightF16[5120 5120]
-
blk.42.attn_q.biasF32[5120]
-
blk.42.attn_q.weightF16[5120 5120]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightF16[5120 1024]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightF16[27392 5120]
-
blk.42.ffn_up.weightF16[5120 27392]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightF16[27392 5120]
-
blk.43.ffn_gate.weightF16[5120 27392]
-
blk.43.ffn_up.weightF16[5120 27392]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightF16[5120 1024]
-
blk.43.attn_output.weightF16[5120 5120]
-
blk.43.attn_q.biasF32[5120]
-
blk.43.attn_q.weightF16[5120 5120]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightF16[5120 1024]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightF16[27392 5120]
-
blk.44.ffn_gate.weightF16[5120 27392]
-
blk.44.ffn_up.weightF16[5120 27392]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightF16[5120 1024]
-
blk.44.attn_output.weightF16[5120 5120]
-
blk.44.attn_q.biasF32[5120]
-
blk.44.attn_q.weightF16[5120 5120]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightF16[5120 1024]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightF16[27392 5120]
-
blk.45.ffn_gate.weightF16[5120 27392]
-
blk.45.ffn_up.weightF16[5120 27392]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightF16[5120 1024]
-
blk.45.attn_output.weightF16[5120 5120]
-
blk.45.attn_q.biasF32[5120]
-
blk.45.attn_q.weightF16[5120 5120]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightF16[5120 1024]
-
blk.46.ffn_gate.weightF16[5120 27392]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightF16[5120 1024]
-
blk.46.attn_output.weightF16[5120 5120]
-
blk.46.attn_q.biasF32[5120]
-
blk.46.attn_q.weightF16[5120 5120]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightF16[5120 1024]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightF16[27392 5120]
-
blk.46.ffn_up.weightF16[5120 27392]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightF16[27392 5120]
-
blk.47.ffn_gate.weightF16[5120 27392]
-
blk.47.ffn_up.weightF16[5120 27392]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightF16[5120 1024]
-
blk.47.attn_output.weightF16[5120 5120]
-
blk.47.attn_q.biasF32[5120]
-
blk.47.attn_q.weightF16[5120 5120]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightF16[5120 1024]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.ffn_down.weightF16[27392 5120]
-
blk.48.ffn_gate.weightF16[5120 27392]
-
blk.48.ffn_up.weightF16[5120 27392]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightF16[5120 1024]
-
blk.48.attn_output.weightF16[5120 5120]
-
blk.48.attn_q.biasF32[5120]
-
blk.48.attn_q.weightF16[5120 5120]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightF16[5120 1024]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.ffn_down.weightF16[27392 5120]
-
blk.49.ffn_gate.weightF16[5120 27392]
-
blk.49.ffn_up.weightF16[5120 27392]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightF16[5120 1024]
-
blk.49.attn_output.weightF16[5120 5120]
-
blk.49.attn_q.biasF32[5120]
-
blk.49.attn_q.weightF16[5120 5120]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightF16[5120 1024]
-
blk.50.ffn_gate.weightF16[5120 27392]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightF16[5120 1024]
-
blk.50.attn_output.weightF16[5120 5120]
-
blk.50.attn_q.biasF32[5120]
-
blk.50.attn_q.weightF16[5120 5120]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightF16[5120 1024]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.ffn_down.weightF16[27392 5120]
-
blk.50.ffn_up.weightF16[5120 27392]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.ffn_down.weightF16[27392 5120]
-
blk.51.ffn_gate.weightF16[5120 27392]
-
blk.51.ffn_up.weightF16[5120 27392]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightF16[5120 1024]
-
blk.51.attn_output.weightF16[5120 5120]
-
blk.51.attn_q.biasF32[5120]
-
blk.51.attn_q.weightF16[5120 5120]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightF16[5120 1024]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.ffn_down.weightF16[27392 5120]
-
blk.52.ffn_gate.weightF16[5120 27392]
-
blk.52.ffn_up.weightF16[5120 27392]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightF16[5120 1024]
-
blk.52.attn_output.weightF16[5120 5120]
-
blk.52.attn_q.biasF32[5120]
-
blk.52.attn_q.weightF16[5120 5120]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightF16[5120 1024]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.ffn_down.weightF16[27392 5120]
-
blk.53.ffn_gate.weightF16[5120 27392]
-
blk.53.ffn_up.weightF16[5120 27392]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightF16[5120 1024]
-
blk.53.attn_output.weightF16[5120 5120]
-
blk.53.attn_q.biasF32[5120]
-
blk.53.attn_q.weightF16[5120 5120]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightF16[5120 1024]
-
blk.54.ffn_gate.weightF16[5120 27392]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightF16[5120 1024]
-
blk.54.attn_output.weightF16[5120 5120]
-
blk.54.attn_q.biasF32[5120]
-
blk.54.attn_q.weightF16[5120 5120]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightF16[5120 1024]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.ffn_down.weightF16[27392 5120]
-
blk.54.ffn_up.weightF16[5120 27392]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.ffn_down.weightF16[27392 5120]
-
blk.55.ffn_gate.weightF16[5120 27392]
-
blk.55.ffn_up.weightF16[5120 27392]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightF16[5120 1024]
-
blk.55.attn_output.weightF16[5120 5120]
-
blk.55.attn_q.biasF32[5120]
-
blk.55.attn_q.weightF16[5120 5120]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightF16[5120 1024]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.ffn_down.weightF16[27392 5120]
-
blk.56.ffn_gate.weightF16[5120 27392]
-
blk.56.ffn_up.weightF16[5120 27392]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightF16[5120 1024]
-
blk.56.attn_output.weightF16[5120 5120]
-
blk.56.attn_q.biasF32[5120]
-
blk.56.attn_q.weightF16[5120 5120]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightF16[5120 1024]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.ffn_down.weightF16[27392 5120]
-
blk.57.ffn_gate.weightF16[5120 27392]
-
blk.57.ffn_up.weightF16[5120 27392]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightF16[5120 1024]
-
blk.57.attn_output.weightF16[5120 5120]
-
blk.57.attn_q.biasF32[5120]
-
blk.57.attn_q.weightF16[5120 5120]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightF16[5120 1024]
-
blk.58.ffn_gate.weightF16[5120 27392]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightF16[5120 1024]
-
blk.58.attn_output.weightF16[5120 5120]
-
blk.58.attn_q.biasF32[5120]
-
blk.58.attn_q.weightF16[5120 5120]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightF16[5120 1024]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.ffn_down.weightF16[27392 5120]
-
blk.58.ffn_up.weightF16[5120 27392]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.ffn_down.weightF16[27392 5120]
-
blk.59.ffn_gate.weightF16[5120 27392]
-
blk.59.ffn_up.weightF16[5120 27392]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightF16[5120 1024]
-
blk.59.attn_output.weightF16[5120 5120]
-
blk.59.attn_q.biasF32[5120]
-
blk.59.attn_q.weightF16[5120 5120]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightF16[5120 1024]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.ffn_down.weightF16[27392 5120]
-
blk.60.ffn_gate.weightF16[5120 27392]
-
blk.60.ffn_up.weightF16[5120 27392]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightF16[5120 1024]
-
blk.60.attn_output.weightF16[5120 5120]
-
blk.60.attn_q.biasF32[5120]
-
blk.60.attn_q.weightF16[5120 5120]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightF16[5120 1024]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.ffn_down.weightF16[27392 5120]
-
blk.61.ffn_gate.weightF16[5120 27392]
-
blk.61.ffn_up.weightF16[5120 27392]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightF16[5120 1024]
-
blk.61.attn_output.weightF16[5120 5120]
-
blk.61.attn_q.biasF32[5120]
-
blk.61.attn_q.weightF16[5120 5120]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightF16[5120 1024]
-
blk.62.ffn_gate.weightF16[5120 27392]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightF16[5120 1024]
-
blk.62.attn_output.weightF16[5120 5120]
-
blk.62.attn_q.biasF32[5120]
-
blk.62.attn_q.weightF16[5120 5120]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightF16[5120 1024]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.ffn_down.weightF16[27392 5120]
-
blk.62.ffn_up.weightF16[5120 27392]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.ffn_down.weightF16[27392 5120]
-
blk.63.ffn_gate.weightF16[5120 27392]
-
blk.63.ffn_up.weightF16[5120 27392]
-
blk.63.ffn_norm.weightF32[5120]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightF16[5120 1024]
-
blk.63.attn_output.weightF16[5120 5120]
-
blk.63.attn_q.biasF32[5120]
-
blk.63.attn_q.weightF16[5120 5120]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightF16[5120 1024]
-
output.weightF16[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63