With correct 16k context window
33B
73 Pulls Updated 3 months ago
d9726a3c89a4 · 35GB
-
general.architecturellama
-
general.file_typeQ8_0
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count62
-
llama.context_length16384
-
llama.embedding_length7168
-
llama.feed_forward_length19200
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32021
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ8_0[7168 32256]
-
blk.0.attn_q.weightQ8_0[7168 7168]
-
blk.0.attn_k.weightQ8_0[7168 1024]
-
blk.0.attn_v.weightQ8_0[7168 1024]
-
blk.0.attn_output.weightQ8_0[7168 7168]
-
blk.0.ffn_gate.weightQ8_0[7168 19200]
-
blk.0.ffn_up.weightQ8_0[7168 19200]
-
blk.0.ffn_down.weightQ8_0[19200 7168]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.1.attn_q.weightQ8_0[7168 7168]
-
blk.1.attn_k.weightQ8_0[7168 1024]
-
blk.1.attn_v.weightQ8_0[7168 1024]
-
blk.1.attn_output.weightQ8_0[7168 7168]
-
blk.1.ffn_gate.weightQ8_0[7168 19200]
-
blk.1.ffn_up.weightQ8_0[7168 19200]
-
blk.1.ffn_down.weightQ8_0[19200 7168]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.2.attn_q.weightQ8_0[7168 7168]
-
blk.2.attn_k.weightQ8_0[7168 1024]
-
blk.2.attn_v.weightQ8_0[7168 1024]
-
blk.2.attn_output.weightQ8_0[7168 7168]
-
blk.2.ffn_gate.weightQ8_0[7168 19200]
-
blk.2.ffn_up.weightQ8_0[7168 19200]
-
blk.2.ffn_down.weightQ8_0[19200 7168]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.3.attn_q.weightQ8_0[7168 7168]
-
blk.3.attn_k.weightQ8_0[7168 1024]
-
blk.3.attn_v.weightQ8_0[7168 1024]
-
blk.3.attn_output.weightQ8_0[7168 7168]
-
blk.3.ffn_gate.weightQ8_0[7168 19200]
-
blk.3.ffn_up.weightQ8_0[7168 19200]
-
blk.3.ffn_down.weightQ8_0[19200 7168]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.4.attn_q.weightQ8_0[7168 7168]
-
blk.4.attn_k.weightQ8_0[7168 1024]
-
blk.4.attn_v.weightQ8_0[7168 1024]
-
blk.4.attn_output.weightQ8_0[7168 7168]
-
blk.4.ffn_gate.weightQ8_0[7168 19200]
-
blk.4.ffn_up.weightQ8_0[7168 19200]
-
blk.4.ffn_down.weightQ8_0[19200 7168]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.5.attn_q.weightQ8_0[7168 7168]
-
blk.5.attn_k.weightQ8_0[7168 1024]
-
blk.5.attn_v.weightQ8_0[7168 1024]
-
blk.5.attn_output.weightQ8_0[7168 7168]
-
blk.5.ffn_gate.weightQ8_0[7168 19200]
-
blk.5.ffn_up.weightQ8_0[7168 19200]
-
blk.5.ffn_down.weightQ8_0[19200 7168]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.6.attn_q.weightQ8_0[7168 7168]
-
blk.6.attn_k.weightQ8_0[7168 1024]
-
blk.6.attn_v.weightQ8_0[7168 1024]
-
blk.6.attn_output.weightQ8_0[7168 7168]
-
blk.6.ffn_gate.weightQ8_0[7168 19200]
-
blk.6.ffn_up.weightQ8_0[7168 19200]
-
blk.6.ffn_down.weightQ8_0[19200 7168]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.7.attn_q.weightQ8_0[7168 7168]
-
blk.7.attn_k.weightQ8_0[7168 1024]
-
blk.7.attn_v.weightQ8_0[7168 1024]
-
blk.7.attn_output.weightQ8_0[7168 7168]
-
blk.7.ffn_gate.weightQ8_0[7168 19200]
-
blk.7.ffn_up.weightQ8_0[7168 19200]
-
blk.7.ffn_down.weightQ8_0[19200 7168]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.8.attn_q.weightQ8_0[7168 7168]
-
blk.8.attn_k.weightQ8_0[7168 1024]
-
blk.8.attn_v.weightQ8_0[7168 1024]
-
blk.8.attn_output.weightQ8_0[7168 7168]
-
blk.8.ffn_gate.weightQ8_0[7168 19200]
-
blk.8.ffn_up.weightQ8_0[7168 19200]
-
blk.8.ffn_down.weightQ8_0[19200 7168]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.9.attn_q.weightQ8_0[7168 7168]
-
blk.9.attn_k.weightQ8_0[7168 1024]
-
blk.9.attn_v.weightQ8_0[7168 1024]
-
blk.9.attn_output.weightQ8_0[7168 7168]
-
blk.9.ffn_gate.weightQ8_0[7168 19200]
-
blk.9.ffn_up.weightQ8_0[7168 19200]
-
blk.9.ffn_down.weightQ8_0[19200 7168]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.10.attn_q.weightQ8_0[7168 7168]
-
blk.10.attn_k.weightQ8_0[7168 1024]
-
blk.10.attn_v.weightQ8_0[7168 1024]
-
blk.10.attn_output.weightQ8_0[7168 7168]
-
blk.10.ffn_gate.weightQ8_0[7168 19200]
-
blk.10.ffn_up.weightQ8_0[7168 19200]
-
blk.10.ffn_down.weightQ8_0[19200 7168]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.11.attn_q.weightQ8_0[7168 7168]
-
blk.11.attn_k.weightQ8_0[7168 1024]
-
blk.11.attn_v.weightQ8_0[7168 1024]
-
blk.11.attn_output.weightQ8_0[7168 7168]
-
blk.11.ffn_gate.weightQ8_0[7168 19200]
-
blk.11.ffn_up.weightQ8_0[7168 19200]
-
blk.11.ffn_down.weightQ8_0[19200 7168]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.12.attn_q.weightQ8_0[7168 7168]
-
blk.12.attn_k.weightQ8_0[7168 1024]
-
blk.12.attn_v.weightQ8_0[7168 1024]
-
blk.12.attn_output.weightQ8_0[7168 7168]
-
blk.12.ffn_gate.weightQ8_0[7168 19200]
-
blk.12.ffn_up.weightQ8_0[7168 19200]
-
blk.12.ffn_down.weightQ8_0[19200 7168]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.13.attn_q.weightQ8_0[7168 7168]
-
blk.13.attn_k.weightQ8_0[7168 1024]
-
blk.13.attn_v.weightQ8_0[7168 1024]
-
blk.13.attn_output.weightQ8_0[7168 7168]
-
blk.13.ffn_gate.weightQ8_0[7168 19200]
-
blk.13.ffn_up.weightQ8_0[7168 19200]
-
blk.13.ffn_down.weightQ8_0[19200 7168]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.14.attn_q.weightQ8_0[7168 7168]
-
blk.14.attn_k.weightQ8_0[7168 1024]
-
blk.14.attn_v.weightQ8_0[7168 1024]
-
blk.14.attn_output.weightQ8_0[7168 7168]
-
blk.14.ffn_gate.weightQ8_0[7168 19200]
-
blk.14.ffn_up.weightQ8_0[7168 19200]
-
blk.14.ffn_down.weightQ8_0[19200 7168]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.15.attn_q.weightQ8_0[7168 7168]
-
blk.15.attn_k.weightQ8_0[7168 1024]
-
blk.15.attn_v.weightQ8_0[7168 1024]
-
blk.15.attn_output.weightQ8_0[7168 7168]
-
blk.15.ffn_gate.weightQ8_0[7168 19200]
-
blk.15.ffn_up.weightQ8_0[7168 19200]
-
blk.15.ffn_down.weightQ8_0[19200 7168]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.16.attn_q.weightQ8_0[7168 7168]
-
blk.16.attn_k.weightQ8_0[7168 1024]
-
blk.16.attn_v.weightQ8_0[7168 1024]
-
blk.16.attn_output.weightQ8_0[7168 7168]
-
blk.16.ffn_gate.weightQ8_0[7168 19200]
-
blk.16.ffn_up.weightQ8_0[7168 19200]
-
blk.16.ffn_down.weightQ8_0[19200 7168]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.17.attn_q.weightQ8_0[7168 7168]
-
blk.17.attn_k.weightQ8_0[7168 1024]
-
blk.17.attn_v.weightQ8_0[7168 1024]
-
blk.17.attn_output.weightQ8_0[7168 7168]
-
blk.17.ffn_gate.weightQ8_0[7168 19200]
-
blk.17.ffn_up.weightQ8_0[7168 19200]
-
blk.17.ffn_down.weightQ8_0[19200 7168]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.18.attn_q.weightQ8_0[7168 7168]
-
blk.18.attn_k.weightQ8_0[7168 1024]
-
blk.18.attn_v.weightQ8_0[7168 1024]
-
blk.18.attn_output.weightQ8_0[7168 7168]
-
blk.18.ffn_gate.weightQ8_0[7168 19200]
-
blk.18.ffn_up.weightQ8_0[7168 19200]
-
blk.18.ffn_down.weightQ8_0[19200 7168]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.19.attn_q.weightQ8_0[7168 7168]
-
blk.19.attn_k.weightQ8_0[7168 1024]
-
blk.19.attn_v.weightQ8_0[7168 1024]
-
blk.19.attn_output.weightQ8_0[7168 7168]
-
blk.19.ffn_gate.weightQ8_0[7168 19200]
-
blk.19.ffn_up.weightQ8_0[7168 19200]
-
blk.19.ffn_down.weightQ8_0[19200 7168]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.20.attn_q.weightQ8_0[7168 7168]
-
blk.20.attn_k.weightQ8_0[7168 1024]
-
blk.20.attn_v.weightQ8_0[7168 1024]
-
blk.20.attn_output.weightQ8_0[7168 7168]
-
blk.20.ffn_gate.weightQ8_0[7168 19200]
-
blk.20.ffn_up.weightQ8_0[7168 19200]
-
blk.20.ffn_down.weightQ8_0[19200 7168]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.21.attn_q.weightQ8_0[7168 7168]
-
blk.21.attn_k.weightQ8_0[7168 1024]
-
blk.21.attn_v.weightQ8_0[7168 1024]
-
blk.21.attn_output.weightQ8_0[7168 7168]
-
blk.21.ffn_gate.weightQ8_0[7168 19200]
-
blk.21.ffn_up.weightQ8_0[7168 19200]
-
blk.21.ffn_down.weightQ8_0[19200 7168]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.22.attn_q.weightQ8_0[7168 7168]
-
blk.22.attn_k.weightQ8_0[7168 1024]
-
blk.22.attn_v.weightQ8_0[7168 1024]
-
blk.22.attn_output.weightQ8_0[7168 7168]
-
blk.22.ffn_gate.weightQ8_0[7168 19200]
-
blk.22.ffn_up.weightQ8_0[7168 19200]
-
blk.22.ffn_down.weightQ8_0[19200 7168]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.23.attn_q.weightQ8_0[7168 7168]
-
blk.23.attn_k.weightQ8_0[7168 1024]
-
blk.23.attn_v.weightQ8_0[7168 1024]
-
blk.23.attn_output.weightQ8_0[7168 7168]
-
blk.23.ffn_gate.weightQ8_0[7168 19200]
-
blk.23.ffn_up.weightQ8_0[7168 19200]
-
blk.23.ffn_down.weightQ8_0[19200 7168]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.24.attn_q.weightQ8_0[7168 7168]
-
blk.24.attn_k.weightQ8_0[7168 1024]
-
blk.24.attn_v.weightQ8_0[7168 1024]
-
blk.24.attn_output.weightQ8_0[7168 7168]
-
blk.24.ffn_gate.weightQ8_0[7168 19200]
-
blk.24.ffn_up.weightQ8_0[7168 19200]
-
blk.24.ffn_down.weightQ8_0[19200 7168]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.25.attn_q.weightQ8_0[7168 7168]
-
blk.25.attn_k.weightQ8_0[7168 1024]
-
blk.25.attn_v.weightQ8_0[7168 1024]
-
blk.25.attn_output.weightQ8_0[7168 7168]
-
blk.25.ffn_gate.weightQ8_0[7168 19200]
-
blk.25.ffn_up.weightQ8_0[7168 19200]
-
blk.25.ffn_down.weightQ8_0[19200 7168]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.26.attn_q.weightQ8_0[7168 7168]
-
blk.26.attn_k.weightQ8_0[7168 1024]
-
blk.26.attn_v.weightQ8_0[7168 1024]
-
blk.26.attn_output.weightQ8_0[7168 7168]
-
blk.26.ffn_gate.weightQ8_0[7168 19200]
-
blk.26.ffn_up.weightQ8_0[7168 19200]
-
blk.26.ffn_down.weightQ8_0[19200 7168]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.27.attn_q.weightQ8_0[7168 7168]
-
blk.27.attn_k.weightQ8_0[7168 1024]
-
blk.27.attn_v.weightQ8_0[7168 1024]
-
blk.27.attn_output.weightQ8_0[7168 7168]
-
blk.27.ffn_gate.weightQ8_0[7168 19200]
-
blk.27.ffn_up.weightQ8_0[7168 19200]
-
blk.27.ffn_down.weightQ8_0[19200 7168]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.28.attn_q.weightQ8_0[7168 7168]
-
blk.28.attn_k.weightQ8_0[7168 1024]
-
blk.28.attn_v.weightQ8_0[7168 1024]
-
blk.28.attn_output.weightQ8_0[7168 7168]
-
blk.28.ffn_gate.weightQ8_0[7168 19200]
-
blk.28.ffn_up.weightQ8_0[7168 19200]
-
blk.28.ffn_down.weightQ8_0[19200 7168]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.29.attn_q.weightQ8_0[7168 7168]
-
blk.29.attn_k.weightQ8_0[7168 1024]
-
blk.29.attn_v.weightQ8_0[7168 1024]
-
blk.29.attn_output.weightQ8_0[7168 7168]
-
blk.29.ffn_gate.weightQ8_0[7168 19200]
-
blk.29.ffn_up.weightQ8_0[7168 19200]
-
blk.29.ffn_down.weightQ8_0[19200 7168]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.30.attn_q.weightQ8_0[7168 7168]
-
blk.30.attn_k.weightQ8_0[7168 1024]
-
blk.30.attn_v.weightQ8_0[7168 1024]
-
blk.30.attn_output.weightQ8_0[7168 7168]
-
blk.30.ffn_gate.weightQ8_0[7168 19200]
-
blk.30.ffn_up.weightQ8_0[7168 19200]
-
blk.30.ffn_down.weightQ8_0[19200 7168]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.31.attn_q.weightQ8_0[7168 7168]
-
blk.31.attn_k.weightQ8_0[7168 1024]
-
blk.31.attn_v.weightQ8_0[7168 1024]
-
blk.31.attn_output.weightQ8_0[7168 7168]
-
blk.31.ffn_gate.weightQ8_0[7168 19200]
-
blk.31.ffn_up.weightQ8_0[7168 19200]
-
blk.31.ffn_down.weightQ8_0[19200 7168]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.32.attn_q.weightQ8_0[7168 7168]
-
blk.32.attn_k.weightQ8_0[7168 1024]
-
blk.32.attn_v.weightQ8_0[7168 1024]
-
blk.32.attn_output.weightQ8_0[7168 7168]
-
blk.32.ffn_gate.weightQ8_0[7168 19200]
-
blk.32.ffn_up.weightQ8_0[7168 19200]
-
blk.32.ffn_down.weightQ8_0[19200 7168]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.33.attn_q.weightQ8_0[7168 7168]
-
blk.33.attn_k.weightQ8_0[7168 1024]
-
blk.33.attn_v.weightQ8_0[7168 1024]
-
blk.33.attn_output.weightQ8_0[7168 7168]
-
blk.33.ffn_gate.weightQ8_0[7168 19200]
-
blk.33.ffn_up.weightQ8_0[7168 19200]
-
blk.33.ffn_down.weightQ8_0[19200 7168]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.34.attn_q.weightQ8_0[7168 7168]
-
blk.34.attn_k.weightQ8_0[7168 1024]
-
blk.34.attn_v.weightQ8_0[7168 1024]
-
blk.34.attn_output.weightQ8_0[7168 7168]
-
blk.34.ffn_gate.weightQ8_0[7168 19200]
-
blk.34.ffn_up.weightQ8_0[7168 19200]
-
blk.34.ffn_down.weightQ8_0[19200 7168]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.35.attn_q.weightQ8_0[7168 7168]
-
blk.35.attn_k.weightQ8_0[7168 1024]
-
blk.35.attn_v.weightQ8_0[7168 1024]
-
blk.35.attn_output.weightQ8_0[7168 7168]
-
blk.35.ffn_gate.weightQ8_0[7168 19200]
-
blk.35.ffn_up.weightQ8_0[7168 19200]
-
blk.35.ffn_down.weightQ8_0[19200 7168]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.36.attn_q.weightQ8_0[7168 7168]
-
blk.36.attn_k.weightQ8_0[7168 1024]
-
blk.36.attn_v.weightQ8_0[7168 1024]
-
blk.36.attn_output.weightQ8_0[7168 7168]
-
blk.36.ffn_gate.weightQ8_0[7168 19200]
-
blk.36.ffn_up.weightQ8_0[7168 19200]
-
blk.36.ffn_down.weightQ8_0[19200 7168]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.37.attn_q.weightQ8_0[7168 7168]
-
blk.37.attn_k.weightQ8_0[7168 1024]
-
blk.37.attn_v.weightQ8_0[7168 1024]
-
blk.37.attn_output.weightQ8_0[7168 7168]
-
blk.37.ffn_gate.weightQ8_0[7168 19200]
-
blk.37.ffn_up.weightQ8_0[7168 19200]
-
blk.37.ffn_down.weightQ8_0[19200 7168]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.38.attn_q.weightQ8_0[7168 7168]
-
blk.38.attn_k.weightQ8_0[7168 1024]
-
blk.38.attn_v.weightQ8_0[7168 1024]
-
blk.38.attn_output.weightQ8_0[7168 7168]
-
blk.38.ffn_gate.weightQ8_0[7168 19200]
-
blk.38.ffn_up.weightQ8_0[7168 19200]
-
blk.38.ffn_down.weightQ8_0[19200 7168]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.39.attn_q.weightQ8_0[7168 7168]
-
blk.39.attn_k.weightQ8_0[7168 1024]
-
blk.39.attn_v.weightQ8_0[7168 1024]
-
blk.39.attn_output.weightQ8_0[7168 7168]
-
blk.39.ffn_gate.weightQ8_0[7168 19200]
-
blk.39.ffn_up.weightQ8_0[7168 19200]
-
blk.39.ffn_down.weightQ8_0[19200 7168]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.40.attn_q.weightQ8_0[7168 7168]
-
blk.40.attn_k.weightQ8_0[7168 1024]
-
blk.40.attn_v.weightQ8_0[7168 1024]
-
blk.40.attn_output.weightQ8_0[7168 7168]
-
blk.40.ffn_gate.weightQ8_0[7168 19200]
-
blk.40.ffn_up.weightQ8_0[7168 19200]
-
blk.40.ffn_down.weightQ8_0[19200 7168]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.41.attn_q.weightQ8_0[7168 7168]
-
blk.41.attn_k.weightQ8_0[7168 1024]
-
blk.41.attn_v.weightQ8_0[7168 1024]
-
blk.41.attn_output.weightQ8_0[7168 7168]
-
blk.41.ffn_gate.weightQ8_0[7168 19200]
-
blk.41.ffn_up.weightQ8_0[7168 19200]
-
blk.41.ffn_down.weightQ8_0[19200 7168]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.42.attn_q.weightQ8_0[7168 7168]
-
blk.42.attn_k.weightQ8_0[7168 1024]
-
blk.42.attn_v.weightQ8_0[7168 1024]
-
blk.42.attn_output.weightQ8_0[7168 7168]
-
blk.42.ffn_gate.weightQ8_0[7168 19200]
-
blk.42.ffn_up.weightQ8_0[7168 19200]
-
blk.42.ffn_down.weightQ8_0[19200 7168]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.43.attn_q.weightQ8_0[7168 7168]
-
blk.43.attn_k.weightQ8_0[7168 1024]
-
blk.43.attn_v.weightQ8_0[7168 1024]
-
blk.43.attn_output.weightQ8_0[7168 7168]
-
blk.43.ffn_gate.weightQ8_0[7168 19200]
-
blk.43.ffn_up.weightQ8_0[7168 19200]
-
blk.43.ffn_down.weightQ8_0[19200 7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.44.attn_q.weightQ8_0[7168 7168]
-
blk.44.attn_k.weightQ8_0[7168 1024]
-
blk.44.attn_v.weightQ8_0[7168 1024]
-
blk.44.attn_output.weightQ8_0[7168 7168]
-
blk.44.ffn_gate.weightQ8_0[7168 19200]
-
blk.44.ffn_up.weightQ8_0[7168 19200]
-
blk.44.ffn_down.weightQ8_0[19200 7168]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.45.attn_q.weightQ8_0[7168 7168]
-
blk.45.attn_k.weightQ8_0[7168 1024]
-
blk.45.attn_v.weightQ8_0[7168 1024]
-
blk.45.attn_output.weightQ8_0[7168 7168]
-
blk.45.ffn_gate.weightQ8_0[7168 19200]
-
blk.45.ffn_up.weightQ8_0[7168 19200]
-
blk.45.ffn_down.weightQ8_0[19200 7168]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.46.attn_q.weightQ8_0[7168 7168]
-
blk.46.attn_k.weightQ8_0[7168 1024]
-
blk.46.attn_v.weightQ8_0[7168 1024]
-
blk.46.attn_output.weightQ8_0[7168 7168]
-
blk.46.ffn_gate.weightQ8_0[7168 19200]
-
blk.46.ffn_up.weightQ8_0[7168 19200]
-
blk.46.ffn_down.weightQ8_0[19200 7168]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.47.attn_q.weightQ8_0[7168 7168]
-
blk.47.attn_k.weightQ8_0[7168 1024]
-
blk.47.attn_v.weightQ8_0[7168 1024]
-
blk.47.attn_output.weightQ8_0[7168 7168]
-
blk.47.ffn_gate.weightQ8_0[7168 19200]
-
blk.47.ffn_up.weightQ8_0[7168 19200]
-
blk.47.ffn_down.weightQ8_0[19200 7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.48.attn_q.weightQ8_0[7168 7168]
-
blk.48.attn_k.weightQ8_0[7168 1024]
-
blk.48.attn_v.weightQ8_0[7168 1024]
-
blk.48.attn_output.weightQ8_0[7168 7168]
-
blk.48.ffn_gate.weightQ8_0[7168 19200]
-
blk.48.ffn_up.weightQ8_0[7168 19200]
-
blk.48.ffn_down.weightQ8_0[19200 7168]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.49.attn_q.weightQ8_0[7168 7168]
-
blk.49.attn_k.weightQ8_0[7168 1024]
-
blk.49.attn_v.weightQ8_0[7168 1024]
-
blk.49.attn_output.weightQ8_0[7168 7168]
-
blk.49.ffn_gate.weightQ8_0[7168 19200]
-
blk.49.ffn_up.weightQ8_0[7168 19200]
-
blk.49.ffn_down.weightQ8_0[19200 7168]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.50.attn_q.weightQ8_0[7168 7168]
-
blk.50.attn_k.weightQ8_0[7168 1024]
-
blk.50.attn_v.weightQ8_0[7168 1024]
-
blk.50.attn_output.weightQ8_0[7168 7168]
-
blk.50.ffn_gate.weightQ8_0[7168 19200]
-
blk.50.ffn_up.weightQ8_0[7168 19200]
-
blk.50.ffn_down.weightQ8_0[19200 7168]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.51.attn_q.weightQ8_0[7168 7168]
-
blk.51.attn_k.weightQ8_0[7168 1024]
-
blk.51.attn_v.weightQ8_0[7168 1024]
-
blk.51.attn_output.weightQ8_0[7168 7168]
-
blk.51.ffn_gate.weightQ8_0[7168 19200]
-
blk.51.ffn_up.weightQ8_0[7168 19200]
-
blk.51.ffn_down.weightQ8_0[19200 7168]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.52.attn_q.weightQ8_0[7168 7168]
-
blk.52.attn_k.weightQ8_0[7168 1024]
-
blk.52.attn_v.weightQ8_0[7168 1024]
-
blk.52.attn_output.weightQ8_0[7168 7168]
-
blk.52.ffn_gate.weightQ8_0[7168 19200]
-
blk.52.ffn_up.weightQ8_0[7168 19200]
-
blk.52.ffn_down.weightQ8_0[19200 7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.53.attn_q.weightQ8_0[7168 7168]
-
blk.53.attn_k.weightQ8_0[7168 1024]
-
blk.53.attn_v.weightQ8_0[7168 1024]
-
blk.53.attn_output.weightQ8_0[7168 7168]
-
blk.53.ffn_gate.weightQ8_0[7168 19200]
-
blk.53.ffn_up.weightQ8_0[7168 19200]
-
blk.53.ffn_down.weightQ8_0[19200 7168]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.54.attn_q.weightQ8_0[7168 7168]
-
blk.54.attn_k.weightQ8_0[7168 1024]
-
blk.54.attn_v.weightQ8_0[7168 1024]
-
blk.54.attn_output.weightQ8_0[7168 7168]
-
blk.54.ffn_gate.weightQ8_0[7168 19200]
-
blk.54.ffn_up.weightQ8_0[7168 19200]
-
blk.54.ffn_down.weightQ8_0[19200 7168]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.55.attn_q.weightQ8_0[7168 7168]
-
blk.55.attn_k.weightQ8_0[7168 1024]
-
blk.55.attn_v.weightQ8_0[7168 1024]
-
blk.55.attn_output.weightQ8_0[7168 7168]
-
blk.55.ffn_gate.weightQ8_0[7168 19200]
-
blk.55.ffn_up.weightQ8_0[7168 19200]
-
blk.55.ffn_down.weightQ8_0[19200 7168]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.56.attn_q.weightQ8_0[7168 7168]
-
blk.56.attn_k.weightQ8_0[7168 1024]
-
blk.56.attn_v.weightQ8_0[7168 1024]
-
blk.56.attn_output.weightQ8_0[7168 7168]
-
blk.56.ffn_gate.weightQ8_0[7168 19200]
-
blk.56.ffn_up.weightQ8_0[7168 19200]
-
blk.56.ffn_down.weightQ8_0[19200 7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.57.attn_q.weightQ8_0[7168 7168]
-
blk.57.attn_k.weightQ8_0[7168 1024]
-
blk.57.attn_v.weightQ8_0[7168 1024]
-
blk.57.attn_output.weightQ8_0[7168 7168]
-
blk.57.ffn_gate.weightQ8_0[7168 19200]
-
blk.57.ffn_up.weightQ8_0[7168 19200]
-
blk.57.ffn_down.weightQ8_0[19200 7168]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.58.attn_q.weightQ8_0[7168 7168]
-
blk.58.attn_k.weightQ8_0[7168 1024]
-
blk.58.attn_v.weightQ8_0[7168 1024]
-
blk.58.attn_output.weightQ8_0[7168 7168]
-
blk.58.ffn_gate.weightQ8_0[7168 19200]
-
blk.58.ffn_up.weightQ8_0[7168 19200]
-
blk.58.ffn_down.weightQ8_0[19200 7168]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.59.attn_q.weightQ8_0[7168 7168]
-
blk.59.attn_k.weightQ8_0[7168 1024]
-
blk.59.attn_v.weightQ8_0[7168 1024]
-
blk.59.attn_output.weightQ8_0[7168 7168]
-
blk.59.ffn_gate.weightQ8_0[7168 19200]
-
blk.59.ffn_up.weightQ8_0[7168 19200]
-
blk.59.ffn_down.weightQ8_0[19200 7168]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_norm.weightF32[7168]
-
blk.60.attn_q.weightQ8_0[7168 7168]
-
blk.60.attn_k.weightQ8_0[7168 1024]
-
blk.60.attn_v.weightQ8_0[7168 1024]
-
blk.60.attn_output.weightQ8_0[7168 7168]
-
blk.60.ffn_gate.weightQ8_0[7168 19200]
-
blk.60.ffn_up.weightQ8_0[7168 19200]
-
blk.60.ffn_down.weightQ8_0[19200 7168]
-
blk.60.attn_norm.weightF32[7168]
-
blk.60.ffn_norm.weightF32[7168]
-
blk.61.attn_q.weightQ8_0[7168 7168]
-
blk.61.attn_k.weightQ8_0[7168 1024]
-
blk.61.attn_v.weightQ8_0[7168 1024]
-
blk.61.attn_output.weightQ8_0[7168 7168]
-
blk.61.ffn_gate.weightQ8_0[7168 19200]
-
blk.61.ffn_up.weightQ8_0[7168 19200]
-
blk.61.ffn_down.weightQ8_0[19200 7168]
-
blk.61.attn_norm.weightF32[7168]
-
blk.61.ffn_norm.weightF32[7168]
-
output_norm.weightF32[7168]
-
output.weightQ8_0[7168 32256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61