latest
4.2GB
3B
69 Pulls Updated 3 months ago
efb12d53ab89 · 4.2GB
-
general.architecturellama
-
general.file_typeQ8_0
-
llama.attention.head_count20
-
llama.attention.head_count_kv20
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count40
-
llama.context_length32768
-
llama.embedding_length2560
-
llama.feed_forward_length6912
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
llama.vocab_size151936
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151643
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ8_0[2560 151936]
-
blk.0.attn_norm.weightF32[2560]
-
blk.0.ffn_down.weightQ8_0[6912 2560]
-
blk.0.ffn_gate.weightQ8_0[2560 6912]
-
blk.0.ffn_up.weightQ8_0[2560 6912]
-
blk.0.ffn_norm.weightF32[2560]
-
blk.0.attn_k.biasF32[2560]
-
blk.0.attn_k.weightQ8_0[2560 2560]
-
blk.0.attn_output.weightQ8_0[2560 2560]
-
blk.0.attn_q.biasF32[2560]
-
blk.0.attn_q.weightQ8_0[2560 2560]
-
blk.0.attn_v.biasF32[2560]
-
blk.0.attn_v.weightQ8_0[2560 2560]
-
blk.1.attn_norm.weightF32[2560]
-
blk.1.ffn_down.weightQ8_0[6912 2560]
-
blk.1.ffn_gate.weightQ8_0[2560 6912]
-
blk.1.ffn_up.weightQ8_0[2560 6912]
-
blk.1.ffn_norm.weightF32[2560]
-
blk.1.attn_k.biasF32[2560]
-
blk.1.attn_k.weightQ8_0[2560 2560]
-
blk.1.attn_output.weightQ8_0[2560 2560]
-
blk.1.attn_q.biasF32[2560]
-
blk.1.attn_q.weightQ8_0[2560 2560]
-
blk.1.attn_v.biasF32[2560]
-
blk.1.attn_v.weightQ8_0[2560 2560]
-
blk.2.attn_norm.weightF32[2560]
-
blk.2.ffn_down.weightQ8_0[6912 2560]
-
blk.2.ffn_gate.weightQ8_0[2560 6912]
-
blk.2.ffn_up.weightQ8_0[2560 6912]
-
blk.2.ffn_norm.weightF32[2560]
-
blk.2.attn_k.biasF32[2560]
-
blk.2.attn_k.weightQ8_0[2560 2560]
-
blk.2.attn_output.weightQ8_0[2560 2560]
-
blk.2.attn_q.biasF32[2560]
-
blk.2.attn_q.weightQ8_0[2560 2560]
-
blk.2.attn_v.biasF32[2560]
-
blk.2.attn_v.weightQ8_0[2560 2560]
-
blk.3.attn_norm.weightF32[2560]
-
blk.3.ffn_down.weightQ8_0[6912 2560]
-
blk.3.ffn_gate.weightQ8_0[2560 6912]
-
blk.3.ffn_up.weightQ8_0[2560 6912]
-
blk.3.ffn_norm.weightF32[2560]
-
blk.3.attn_k.biasF32[2560]
-
blk.3.attn_k.weightQ8_0[2560 2560]
-
blk.3.attn_output.weightQ8_0[2560 2560]
-
blk.3.attn_q.biasF32[2560]
-
blk.3.attn_q.weightQ8_0[2560 2560]
-
blk.3.attn_v.biasF32[2560]
-
blk.3.attn_v.weightQ8_0[2560 2560]
-
blk.4.attn_norm.weightF32[2560]
-
blk.4.ffn_down.weightQ8_0[6912 2560]
-
blk.4.ffn_gate.weightQ8_0[2560 6912]
-
blk.4.ffn_up.weightQ8_0[2560 6912]
-
blk.4.ffn_norm.weightF32[2560]
-
blk.4.attn_k.biasF32[2560]
-
blk.4.attn_k.weightQ8_0[2560 2560]
-
blk.4.attn_output.weightQ8_0[2560 2560]
-
blk.4.attn_q.biasF32[2560]
-
blk.4.attn_q.weightQ8_0[2560 2560]
-
blk.4.attn_v.biasF32[2560]
-
blk.4.attn_v.weightQ8_0[2560 2560]
-
blk.5.attn_norm.weightF32[2560]
-
blk.5.ffn_down.weightQ8_0[6912 2560]
-
blk.5.ffn_gate.weightQ8_0[2560 6912]
-
blk.5.ffn_up.weightQ8_0[2560 6912]
-
blk.5.ffn_norm.weightF32[2560]
-
blk.5.attn_k.biasF32[2560]
-
blk.5.attn_k.weightQ8_0[2560 2560]
-
blk.5.attn_output.weightQ8_0[2560 2560]
-
blk.5.attn_q.biasF32[2560]
-
blk.5.attn_q.weightQ8_0[2560 2560]
-
blk.5.attn_v.biasF32[2560]
-
blk.5.attn_v.weightQ8_0[2560 2560]
-
blk.6.attn_norm.weightF32[2560]
-
blk.6.ffn_down.weightQ8_0[6912 2560]
-
blk.6.ffn_gate.weightQ8_0[2560 6912]
-
blk.6.ffn_up.weightQ8_0[2560 6912]
-
blk.6.ffn_norm.weightF32[2560]
-
blk.6.attn_k.biasF32[2560]
-
blk.6.attn_k.weightQ8_0[2560 2560]
-
blk.6.attn_output.weightQ8_0[2560 2560]
-
blk.6.attn_q.biasF32[2560]
-
blk.6.attn_q.weightQ8_0[2560 2560]
-
blk.6.attn_v.biasF32[2560]
-
blk.6.attn_v.weightQ8_0[2560 2560]
-
blk.7.attn_norm.weightF32[2560]
-
blk.7.ffn_down.weightQ8_0[6912 2560]
-
blk.7.ffn_gate.weightQ8_0[2560 6912]
-
blk.7.ffn_up.weightQ8_0[2560 6912]
-
blk.7.ffn_norm.weightF32[2560]
-
blk.7.attn_k.biasF32[2560]
-
blk.7.attn_k.weightQ8_0[2560 2560]
-
blk.7.attn_output.weightQ8_0[2560 2560]
-
blk.7.attn_q.biasF32[2560]
-
blk.7.attn_q.weightQ8_0[2560 2560]
-
blk.7.attn_v.biasF32[2560]
-
blk.7.attn_v.weightQ8_0[2560 2560]
-
blk.8.attn_norm.weightF32[2560]
-
blk.8.ffn_down.weightQ8_0[6912 2560]
-
blk.8.ffn_gate.weightQ8_0[2560 6912]
-
blk.8.ffn_up.weightQ8_0[2560 6912]
-
blk.8.ffn_norm.weightF32[2560]
-
blk.8.attn_k.biasF32[2560]
-
blk.8.attn_k.weightQ8_0[2560 2560]
-
blk.8.attn_output.weightQ8_0[2560 2560]
-
blk.8.attn_q.biasF32[2560]
-
blk.8.attn_q.weightQ8_0[2560 2560]
-
blk.8.attn_v.biasF32[2560]
-
blk.8.attn_v.weightQ8_0[2560 2560]
-
blk.9.attn_norm.weightF32[2560]
-
blk.9.ffn_down.weightQ8_0[6912 2560]
-
blk.9.ffn_gate.weightQ8_0[2560 6912]
-
blk.9.ffn_up.weightQ8_0[2560 6912]
-
blk.9.ffn_norm.weightF32[2560]
-
blk.9.attn_k.biasF32[2560]
-
blk.9.attn_k.weightQ8_0[2560 2560]
-
blk.9.attn_output.weightQ8_0[2560 2560]
-
blk.9.attn_q.biasF32[2560]
-
blk.9.attn_q.weightQ8_0[2560 2560]
-
blk.9.attn_v.biasF32[2560]
-
blk.9.attn_v.weightQ8_0[2560 2560]
-
blk.10.attn_norm.weightF32[2560]
-
blk.10.ffn_down.weightQ8_0[6912 2560]
-
blk.10.ffn_gate.weightQ8_0[2560 6912]
-
blk.10.ffn_up.weightQ8_0[2560 6912]
-
blk.10.ffn_norm.weightF32[2560]
-
blk.10.attn_k.biasF32[2560]
-
blk.10.attn_k.weightQ8_0[2560 2560]
-
blk.10.attn_output.weightQ8_0[2560 2560]
-
blk.10.attn_q.biasF32[2560]
-
blk.10.attn_q.weightQ8_0[2560 2560]
-
blk.10.attn_v.biasF32[2560]
-
blk.10.attn_v.weightQ8_0[2560 2560]
-
blk.11.attn_norm.weightF32[2560]
-
blk.11.ffn_down.weightQ8_0[6912 2560]
-
blk.11.ffn_gate.weightQ8_0[2560 6912]
-
blk.11.ffn_up.weightQ8_0[2560 6912]
-
blk.11.ffn_norm.weightF32[2560]
-
blk.11.attn_k.biasF32[2560]
-
blk.11.attn_k.weightQ8_0[2560 2560]
-
blk.11.attn_output.weightQ8_0[2560 2560]
-
blk.11.attn_q.biasF32[2560]
-
blk.11.attn_q.weightQ8_0[2560 2560]
-
blk.11.attn_v.biasF32[2560]
-
blk.11.attn_v.weightQ8_0[2560 2560]
-
blk.12.attn_norm.weightF32[2560]
-
blk.12.ffn_down.weightQ8_0[6912 2560]
-
blk.12.ffn_gate.weightQ8_0[2560 6912]
-
blk.12.ffn_up.weightQ8_0[2560 6912]
-
blk.12.ffn_norm.weightF32[2560]
-
blk.12.attn_k.biasF32[2560]
-
blk.12.attn_k.weightQ8_0[2560 2560]
-
blk.12.attn_output.weightQ8_0[2560 2560]
-
blk.12.attn_q.biasF32[2560]
-
blk.12.attn_q.weightQ8_0[2560 2560]
-
blk.12.attn_v.biasF32[2560]
-
blk.12.attn_v.weightQ8_0[2560 2560]
-
blk.13.attn_norm.weightF32[2560]
-
blk.13.ffn_down.weightQ8_0[6912 2560]
-
blk.13.ffn_gate.weightQ8_0[2560 6912]
-
blk.13.ffn_up.weightQ8_0[2560 6912]
-
blk.13.ffn_norm.weightF32[2560]
-
blk.13.attn_k.biasF32[2560]
-
blk.13.attn_k.weightQ8_0[2560 2560]
-
blk.13.attn_output.weightQ8_0[2560 2560]
-
blk.13.attn_q.biasF32[2560]
-
blk.13.attn_q.weightQ8_0[2560 2560]
-
blk.13.attn_v.biasF32[2560]
-
blk.13.attn_v.weightQ8_0[2560 2560]
-
blk.14.attn_norm.weightF32[2560]
-
blk.14.ffn_down.weightQ8_0[6912 2560]
-
blk.14.ffn_gate.weightQ8_0[2560 6912]
-
blk.14.ffn_up.weightQ8_0[2560 6912]
-
blk.14.ffn_norm.weightF32[2560]
-
blk.14.attn_k.biasF32[2560]
-
blk.14.attn_k.weightQ8_0[2560 2560]
-
blk.14.attn_output.weightQ8_0[2560 2560]
-
blk.14.attn_q.biasF32[2560]
-
blk.14.attn_q.weightQ8_0[2560 2560]
-
blk.14.attn_v.biasF32[2560]
-
blk.14.attn_v.weightQ8_0[2560 2560]
-
blk.15.attn_norm.weightF32[2560]
-
blk.15.ffn_down.weightQ8_0[6912 2560]
-
blk.15.ffn_gate.weightQ8_0[2560 6912]
-
blk.15.ffn_up.weightQ8_0[2560 6912]
-
blk.15.ffn_norm.weightF32[2560]
-
blk.15.attn_k.biasF32[2560]
-
blk.15.attn_k.weightQ8_0[2560 2560]
-
blk.15.attn_output.weightQ8_0[2560 2560]
-
blk.15.attn_q.biasF32[2560]
-
blk.15.attn_q.weightQ8_0[2560 2560]
-
blk.15.attn_v.biasF32[2560]
-
blk.15.attn_v.weightQ8_0[2560 2560]
-
blk.16.attn_norm.weightF32[2560]
-
blk.16.ffn_down.weightQ8_0[6912 2560]
-
blk.16.ffn_gate.weightQ8_0[2560 6912]
-
blk.16.ffn_up.weightQ8_0[2560 6912]
-
blk.16.ffn_norm.weightF32[2560]
-
blk.16.attn_k.biasF32[2560]
-
blk.16.attn_k.weightQ8_0[2560 2560]
-
blk.16.attn_output.weightQ8_0[2560 2560]
-
blk.16.attn_q.biasF32[2560]
-
blk.16.attn_q.weightQ8_0[2560 2560]
-
blk.16.attn_v.biasF32[2560]
-
blk.16.attn_v.weightQ8_0[2560 2560]
-
blk.17.attn_norm.weightF32[2560]
-
blk.17.ffn_down.weightQ8_0[6912 2560]
-
blk.17.ffn_gate.weightQ8_0[2560 6912]
-
blk.17.ffn_up.weightQ8_0[2560 6912]
-
blk.17.ffn_norm.weightF32[2560]
-
blk.17.attn_k.biasF32[2560]
-
blk.17.attn_k.weightQ8_0[2560 2560]
-
blk.17.attn_output.weightQ8_0[2560 2560]
-
blk.17.attn_q.biasF32[2560]
-
blk.17.attn_q.weightQ8_0[2560 2560]
-
blk.17.attn_v.biasF32[2560]
-
blk.17.attn_v.weightQ8_0[2560 2560]
-
blk.18.attn_norm.weightF32[2560]
-
blk.18.ffn_down.weightQ8_0[6912 2560]
-
blk.18.ffn_gate.weightQ8_0[2560 6912]
-
blk.18.ffn_up.weightQ8_0[2560 6912]
-
blk.18.ffn_norm.weightF32[2560]
-
blk.18.attn_k.biasF32[2560]
-
blk.18.attn_k.weightQ8_0[2560 2560]
-
blk.18.attn_output.weightQ8_0[2560 2560]
-
blk.18.attn_q.biasF32[2560]
-
blk.18.attn_q.weightQ8_0[2560 2560]
-
blk.18.attn_v.biasF32[2560]
-
blk.18.attn_v.weightQ8_0[2560 2560]
-
blk.19.attn_norm.weightF32[2560]
-
blk.19.ffn_down.weightQ8_0[6912 2560]
-
blk.19.ffn_gate.weightQ8_0[2560 6912]
-
blk.19.ffn_up.weightQ8_0[2560 6912]
-
blk.19.ffn_norm.weightF32[2560]
-
blk.19.attn_k.biasF32[2560]
-
blk.19.attn_k.weightQ8_0[2560 2560]
-
blk.19.attn_output.weightQ8_0[2560 2560]
-
blk.19.attn_q.biasF32[2560]
-
blk.19.attn_q.weightQ8_0[2560 2560]
-
blk.19.attn_v.biasF32[2560]
-
blk.19.attn_v.weightQ8_0[2560 2560]
-
blk.20.attn_norm.weightF32[2560]
-
blk.20.ffn_down.weightQ8_0[6912 2560]
-
blk.20.ffn_gate.weightQ8_0[2560 6912]
-
blk.20.ffn_up.weightQ8_0[2560 6912]
-
blk.20.ffn_norm.weightF32[2560]
-
blk.20.attn_k.biasF32[2560]
-
blk.20.attn_k.weightQ8_0[2560 2560]
-
blk.20.attn_output.weightQ8_0[2560 2560]
-
blk.20.attn_q.biasF32[2560]
-
blk.20.attn_q.weightQ8_0[2560 2560]
-
blk.20.attn_v.biasF32[2560]
-
blk.20.attn_v.weightQ8_0[2560 2560]
-
blk.21.attn_norm.weightF32[2560]
-
blk.21.ffn_down.weightQ8_0[6912 2560]
-
blk.21.ffn_gate.weightQ8_0[2560 6912]
-
blk.21.ffn_up.weightQ8_0[2560 6912]
-
blk.21.ffn_norm.weightF32[2560]
-
blk.21.attn_k.biasF32[2560]
-
blk.21.attn_k.weightQ8_0[2560 2560]
-
blk.21.attn_output.weightQ8_0[2560 2560]
-
blk.21.attn_q.biasF32[2560]
-
blk.21.attn_q.weightQ8_0[2560 2560]
-
blk.21.attn_v.biasF32[2560]
-
blk.21.attn_v.weightQ8_0[2560 2560]
-
blk.22.attn_norm.weightF32[2560]
-
blk.22.ffn_down.weightQ8_0[6912 2560]
-
blk.22.ffn_gate.weightQ8_0[2560 6912]
-
blk.22.ffn_up.weightQ8_0[2560 6912]
-
blk.22.ffn_norm.weightF32[2560]
-
blk.22.attn_k.biasF32[2560]
-
blk.22.attn_k.weightQ8_0[2560 2560]
-
blk.22.attn_output.weightQ8_0[2560 2560]
-
blk.22.attn_q.biasF32[2560]
-
blk.22.attn_q.weightQ8_0[2560 2560]
-
blk.22.attn_v.biasF32[2560]
-
blk.22.attn_v.weightQ8_0[2560 2560]
-
blk.23.attn_norm.weightF32[2560]
-
blk.23.ffn_down.weightQ8_0[6912 2560]
-
blk.23.ffn_gate.weightQ8_0[2560 6912]
-
blk.23.ffn_up.weightQ8_0[2560 6912]
-
blk.23.ffn_norm.weightF32[2560]
-
blk.23.attn_k.biasF32[2560]
-
blk.23.attn_k.weightQ8_0[2560 2560]
-
blk.23.attn_output.weightQ8_0[2560 2560]
-
blk.23.attn_q.biasF32[2560]
-
blk.23.attn_q.weightQ8_0[2560 2560]
-
blk.23.attn_v.biasF32[2560]
-
blk.23.attn_v.weightQ8_0[2560 2560]
-
blk.24.attn_norm.weightF32[2560]
-
blk.24.ffn_down.weightQ8_0[6912 2560]
-
blk.24.ffn_gate.weightQ8_0[2560 6912]
-
blk.24.ffn_up.weightQ8_0[2560 6912]
-
blk.24.ffn_norm.weightF32[2560]
-
blk.24.attn_k.biasF32[2560]
-
blk.24.attn_k.weightQ8_0[2560 2560]
-
blk.24.attn_output.weightQ8_0[2560 2560]
-
blk.24.attn_q.biasF32[2560]
-
blk.24.attn_q.weightQ8_0[2560 2560]
-
blk.24.attn_v.biasF32[2560]
-
blk.24.attn_v.weightQ8_0[2560 2560]
-
blk.25.attn_norm.weightF32[2560]
-
blk.25.ffn_down.weightQ8_0[6912 2560]
-
blk.25.ffn_gate.weightQ8_0[2560 6912]
-
blk.25.ffn_up.weightQ8_0[2560 6912]
-
blk.25.ffn_norm.weightF32[2560]
-
blk.25.attn_k.biasF32[2560]
-
blk.25.attn_k.weightQ8_0[2560 2560]
-
blk.25.attn_output.weightQ8_0[2560 2560]
-
blk.25.attn_q.biasF32[2560]
-
blk.25.attn_q.weightQ8_0[2560 2560]
-
blk.25.attn_v.biasF32[2560]
-
blk.25.attn_v.weightQ8_0[2560 2560]
-
blk.26.ffn_gate.weightQ8_0[2560 6912]
-
blk.26.attn_k.biasF32[2560]
-
blk.26.attn_k.weightQ8_0[2560 2560]
-
blk.26.attn_output.weightQ8_0[2560 2560]
-
blk.26.attn_q.biasF32[2560]
-
blk.26.attn_q.weightQ8_0[2560 2560]
-
blk.26.attn_v.biasF32[2560]
-
blk.26.attn_v.weightQ8_0[2560 2560]
-
blk.26.attn_norm.weightF32[2560]
-
blk.26.ffn_down.weightQ8_0[6912 2560]
-
blk.26.ffn_up.weightQ8_0[2560 6912]
-
blk.26.ffn_norm.weightF32[2560]
-
blk.27.attn_norm.weightF32[2560]
-
blk.27.ffn_down.weightQ8_0[6912 2560]
-
blk.27.ffn_gate.weightQ8_0[2560 6912]
-
blk.27.ffn_up.weightQ8_0[2560 6912]
-
blk.27.ffn_norm.weightF32[2560]
-
blk.27.attn_k.biasF32[2560]
-
blk.27.attn_k.weightQ8_0[2560 2560]
-
blk.27.attn_output.weightQ8_0[2560 2560]
-
blk.27.attn_q.biasF32[2560]
-
blk.27.attn_q.weightQ8_0[2560 2560]
-
blk.27.attn_v.biasF32[2560]
-
blk.27.attn_v.weightQ8_0[2560 2560]
-
blk.28.attn_norm.weightF32[2560]
-
blk.28.ffn_down.weightQ8_0[6912 2560]
-
blk.28.ffn_gate.weightQ8_0[2560 6912]
-
blk.28.ffn_up.weightQ8_0[2560 6912]
-
blk.28.ffn_norm.weightF32[2560]
-
blk.28.attn_k.biasF32[2560]
-
blk.28.attn_k.weightQ8_0[2560 2560]
-
blk.28.attn_output.weightQ8_0[2560 2560]
-
blk.28.attn_q.biasF32[2560]
-
blk.28.attn_q.weightQ8_0[2560 2560]
-
blk.28.attn_v.biasF32[2560]
-
blk.28.attn_v.weightQ8_0[2560 2560]
-
blk.29.attn_norm.weightF32[2560]
-
blk.29.ffn_down.weightQ8_0[6912 2560]
-
blk.29.ffn_gate.weightQ8_0[2560 6912]
-
blk.29.ffn_up.weightQ8_0[2560 6912]
-
blk.29.ffn_norm.weightF32[2560]
-
blk.29.attn_k.biasF32[2560]
-
blk.29.attn_k.weightQ8_0[2560 2560]
-
blk.29.attn_output.weightQ8_0[2560 2560]
-
blk.29.attn_q.biasF32[2560]
-
blk.29.attn_q.weightQ8_0[2560 2560]
-
blk.29.attn_v.biasF32[2560]
-
blk.29.attn_v.weightQ8_0[2560 2560]
-
blk.30.attn_norm.weightF32[2560]
-
blk.30.ffn_down.weightQ8_0[6912 2560]
-
blk.30.ffn_gate.weightQ8_0[2560 6912]
-
blk.30.ffn_up.weightQ8_0[2560 6912]
-
blk.30.ffn_norm.weightF32[2560]
-
blk.30.attn_k.biasF32[2560]
-
blk.30.attn_k.weightQ8_0[2560 2560]
-
blk.30.attn_output.weightQ8_0[2560 2560]
-
blk.30.attn_q.biasF32[2560]
-
blk.30.attn_q.weightQ8_0[2560 2560]
-
blk.30.attn_v.biasF32[2560]
-
blk.30.attn_v.weightQ8_0[2560 2560]
-
blk.31.attn_norm.weightF32[2560]
-
blk.31.ffn_down.weightQ8_0[6912 2560]
-
blk.31.ffn_gate.weightQ8_0[2560 6912]
-
blk.31.ffn_up.weightQ8_0[2560 6912]
-
blk.31.ffn_norm.weightF32[2560]
-
blk.31.attn_k.biasF32[2560]
-
blk.31.attn_k.weightQ8_0[2560 2560]
-
blk.31.attn_output.weightQ8_0[2560 2560]
-
blk.31.attn_q.biasF32[2560]
-
blk.31.attn_q.weightQ8_0[2560 2560]
-
blk.31.attn_v.biasF32[2560]
-
blk.31.attn_v.weightQ8_0[2560 2560]
-
blk.32.attn_norm.weightF32[2560]
-
blk.32.ffn_down.weightQ8_0[6912 2560]
-
blk.32.ffn_gate.weightQ8_0[2560 6912]
-
blk.32.ffn_up.weightQ8_0[2560 6912]
-
blk.32.ffn_norm.weightF32[2560]
-
blk.32.attn_k.biasF32[2560]
-
blk.32.attn_k.weightQ8_0[2560 2560]
-
blk.32.attn_output.weightQ8_0[2560 2560]
-
blk.32.attn_q.biasF32[2560]
-
blk.32.attn_q.weightQ8_0[2560 2560]
-
blk.32.attn_v.biasF32[2560]
-
blk.32.attn_v.weightQ8_0[2560 2560]
-
blk.33.attn_norm.weightF32[2560]
-
blk.33.ffn_down.weightQ8_0[6912 2560]
-
blk.33.ffn_gate.weightQ8_0[2560 6912]
-
blk.33.ffn_up.weightQ8_0[2560 6912]
-
blk.33.ffn_norm.weightF32[2560]
-
blk.33.attn_k.biasF32[2560]
-
blk.33.attn_k.weightQ8_0[2560 2560]
-
blk.33.attn_output.weightQ8_0[2560 2560]
-
blk.33.attn_q.biasF32[2560]
-
blk.33.attn_q.weightQ8_0[2560 2560]
-
blk.33.attn_v.biasF32[2560]
-
blk.33.attn_v.weightQ8_0[2560 2560]
-
blk.34.attn_norm.weightF32[2560]
-
blk.34.ffn_down.weightQ8_0[6912 2560]
-
blk.34.ffn_gate.weightQ8_0[2560 6912]
-
blk.34.ffn_up.weightQ8_0[2560 6912]
-
blk.34.ffn_norm.weightF32[2560]
-
blk.34.attn_k.biasF32[2560]
-
blk.34.attn_k.weightQ8_0[2560 2560]
-
blk.34.attn_output.weightQ8_0[2560 2560]
-
blk.34.attn_q.biasF32[2560]
-
blk.34.attn_q.weightQ8_0[2560 2560]
-
blk.34.attn_v.biasF32[2560]
-
blk.34.attn_v.weightQ8_0[2560 2560]
-
blk.35.attn_norm.weightF32[2560]
-
blk.35.ffn_down.weightQ8_0[6912 2560]
-
blk.35.ffn_gate.weightQ8_0[2560 6912]
-
blk.35.ffn_up.weightQ8_0[2560 6912]
-
blk.35.ffn_norm.weightF32[2560]
-
blk.35.attn_k.biasF32[2560]
-
blk.35.attn_k.weightQ8_0[2560 2560]
-
blk.35.attn_output.weightQ8_0[2560 2560]
-
blk.35.attn_q.biasF32[2560]
-
blk.35.attn_q.weightQ8_0[2560 2560]
-
blk.35.attn_v.biasF32[2560]
-
blk.35.attn_v.weightQ8_0[2560 2560]
-
blk.36.attn_norm.weightF32[2560]
-
blk.36.ffn_down.weightQ8_0[6912 2560]
-
blk.36.ffn_gate.weightQ8_0[2560 6912]
-
blk.36.ffn_up.weightQ8_0[2560 6912]
-
blk.36.ffn_norm.weightF32[2560]
-
blk.36.attn_k.biasF32[2560]
-
blk.36.attn_k.weightQ8_0[2560 2560]
-
blk.36.attn_output.weightQ8_0[2560 2560]
-
blk.36.attn_q.biasF32[2560]
-
blk.36.attn_q.weightQ8_0[2560 2560]
-
blk.36.attn_v.biasF32[2560]
-
blk.36.attn_v.weightQ8_0[2560 2560]
-
blk.37.attn_norm.weightF32[2560]
-
blk.37.ffn_down.weightQ8_0[6912 2560]
-
blk.37.ffn_gate.weightQ8_0[2560 6912]
-
blk.37.ffn_up.weightQ8_0[2560 6912]
-
blk.37.ffn_norm.weightF32[2560]
-
blk.37.attn_k.biasF32[2560]
-
blk.37.attn_k.weightQ8_0[2560 2560]
-
blk.37.attn_output.weightQ8_0[2560 2560]
-
blk.37.attn_q.biasF32[2560]
-
blk.37.attn_q.weightQ8_0[2560 2560]
-
blk.37.attn_v.biasF32[2560]
-
blk.37.attn_v.weightQ8_0[2560 2560]
-
blk.38.attn_norm.weightF32[2560]
-
blk.38.ffn_down.weightQ8_0[6912 2560]
-
blk.38.ffn_gate.weightQ8_0[2560 6912]
-
blk.38.ffn_up.weightQ8_0[2560 6912]
-
blk.38.ffn_norm.weightF32[2560]
-
blk.38.attn_k.biasF32[2560]
-
blk.38.attn_k.weightQ8_0[2560 2560]
-
blk.38.attn_output.weightQ8_0[2560 2560]
-
blk.38.attn_q.biasF32[2560]
-
blk.38.attn_q.weightQ8_0[2560 2560]
-
blk.38.attn_v.biasF32[2560]
-
blk.38.attn_v.weightQ8_0[2560 2560]
-
blk.39.attn_norm.weightF32[2560]
-
blk.39.ffn_down.weightQ8_0[6912 2560]
-
blk.39.ffn_gate.weightQ8_0[2560 6912]
-
blk.39.ffn_up.weightQ8_0[2560 6912]
-
blk.39.ffn_norm.weightF32[2560]
-
blk.39.attn_k.biasF32[2560]
-
blk.39.attn_k.weightQ8_0[2560 2560]
-
blk.39.attn_output.weightQ8_0[2560 2560]
-
blk.39.attn_q.biasF32[2560]
-
blk.39.attn_q.weightQ8_0[2560 2560]
-
blk.39.attn_v.biasF32[2560]
-
blk.39.attn_v.weightQ8_0[2560 2560]
-
output.weightQ8_0[2560 151936]
-
output_norm.weightF32[2560]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39