latest
39GB
An assistant for a variety of infrastructure and deployment tasks
70B
7 Pulls Updated 5 months ago
1436d66b6975 · 39GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length2048
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_0[8192 32016]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_0[28672 8192]
-
blk.0.ffn_gate.weightQ4_0[8192 28672]
-
blk.0.ffn_up.weightQ4_0[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_0[8192 1024]
-
blk.0.attn_output.weightQ4_0[8192 8192]
-
blk.0.attn_q.weightQ4_0[8192 8192]
-
blk.0.attn_v.weightQ4_0[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_0[28672 8192]
-
blk.1.ffn_gate.weightQ4_0[8192 28672]
-
blk.1.ffn_up.weightQ4_0[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ4_0[8192 1024]
-
blk.1.attn_output.weightQ4_0[8192 8192]
-
blk.1.attn_q.weightQ4_0[8192 8192]
-
blk.1.attn_v.weightQ4_0[8192 1024]
-
blk.2.ffn_gate.weightQ4_0[8192 28672]
-
blk.2.attn_k.weightQ4_0[8192 1024]
-
blk.2.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_q.weightQ4_0[8192 8192]
-
blk.2.attn_v.weightQ4_0[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_0[28672 8192]
-
blk.2.ffn_up.weightQ4_0[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_0[28672 8192]
-
blk.3.ffn_gate.weightQ4_0[8192 28672]
-
blk.3.ffn_up.weightQ4_0[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ4_0[8192 1024]
-
blk.3.attn_output.weightQ4_0[8192 8192]
-
blk.3.attn_q.weightQ4_0[8192 8192]
-
blk.3.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_0[28672 8192]
-
blk.4.ffn_gate.weightQ4_0[8192 28672]
-
blk.4.ffn_up.weightQ4_0[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ4_0[8192 1024]
-
blk.4.attn_output.weightQ4_0[8192 8192]
-
blk.4.attn_q.weightQ4_0[8192 8192]
-
blk.4.attn_v.weightQ4_0[8192 1024]
-
blk.5.attn_k.weightQ4_0[8192 1024]
-
blk.5.attn_output.weightQ4_0[8192 8192]
-
blk.5.attn_q.weightQ4_0[8192 8192]
-
blk.5.attn_v.weightQ4_0[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_0[28672 8192]
-
blk.5.ffn_gate.weightQ4_0[8192 28672]
-
blk.5.ffn_up.weightQ4_0[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_0[28672 8192]
-
blk.6.ffn_gate.weightQ4_0[8192 28672]
-
blk.6.ffn_up.weightQ4_0[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightQ4_0[8192 1024]
-
blk.6.attn_output.weightQ4_0[8192 8192]
-
blk.6.attn_q.weightQ4_0[8192 8192]
-
blk.6.attn_v.weightQ4_0[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_0[28672 8192]
-
blk.7.ffn_gate.weightQ4_0[8192 28672]
-
blk.7.ffn_up.weightQ4_0[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ4_0[8192 1024]
-
blk.7.attn_output.weightQ4_0[8192 8192]
-
blk.7.attn_q.weightQ4_0[8192 8192]
-
blk.7.attn_v.weightQ4_0[8192 1024]
-
blk.8.attn_k.weightQ4_0[8192 1024]
-
blk.8.attn_q.weightQ4_0[8192 8192]
-
blk.8.attn_v.weightQ4_0[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_0[28672 8192]
-
blk.8.ffn_gate.weightQ4_0[8192 28672]
-
blk.8.ffn_up.weightQ4_0[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_0[28672 8192]
-
blk.9.ffn_gate.weightQ4_0[8192 28672]
-
blk.9.ffn_up.weightQ4_0[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_0[8192 1024]
-
blk.9.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_q.weightQ4_0[8192 8192]
-
blk.9.attn_v.weightQ4_0[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_0[28672 8192]
-
blk.10.ffn_gate.weightQ4_0[8192 28672]
-
blk.10.ffn_up.weightQ4_0[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ4_0[8192 1024]
-
blk.10.attn_output.weightQ4_0[8192 8192]
-
blk.10.attn_q.weightQ4_0[8192 8192]
-
blk.10.attn_v.weightQ4_0[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_0[28672 8192]
-
blk.11.ffn_gate.weightQ4_0[8192 28672]
-
blk.11.ffn_up.weightQ4_0[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ4_0[8192 1024]
-
blk.11.attn_output.weightQ4_0[8192 8192]
-
blk.11.attn_q.weightQ4_0[8192 8192]
-
blk.11.attn_v.weightQ4_0[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_0[28672 8192]
-
blk.12.ffn_gate.weightQ4_0[8192 28672]
-
blk.12.ffn_up.weightQ4_0[8192 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.weightQ4_0[8192 1024]
-
blk.12.attn_output.weightQ4_0[8192 8192]
-
blk.12.attn_q.weightQ4_0[8192 8192]
-
blk.12.attn_v.weightQ4_0[8192 1024]
-
blk.13.ffn_gate.weightQ4_0[8192 28672]
-
blk.13.ffn_up.weightQ4_0[8192 28672]
-
blk.13.attn_k.weightQ4_0[8192 1024]
-
blk.13.attn_output.weightQ4_0[8192 8192]
-
blk.13.attn_q.weightQ4_0[8192 8192]
-
blk.13.attn_v.weightQ4_0[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_0[28672 8192]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_0[28672 8192]
-
blk.14.ffn_gate.weightQ4_0[8192 28672]
-
blk.14.ffn_up.weightQ4_0[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_0[8192 1024]
-
blk.14.attn_output.weightQ4_0[8192 8192]
-
blk.14.attn_q.weightQ4_0[8192 8192]
-
blk.14.attn_v.weightQ4_0[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_0[28672 8192]
-
blk.15.ffn_gate.weightQ4_0[8192 28672]
-
blk.15.ffn_up.weightQ4_0[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ4_0[8192 1024]
-
blk.15.attn_output.weightQ4_0[8192 8192]
-
blk.15.attn_q.weightQ4_0[8192 8192]
-
blk.15.attn_v.weightQ4_0[8192 1024]
-
blk.16.ffn_gate.weightQ4_0[8192 28672]
-
blk.16.attn_k.weightQ4_0[8192 1024]
-
blk.16.attn_output.weightQ4_0[8192 8192]
-
blk.16.attn_q.weightQ4_0[8192 8192]
-
blk.16.attn_v.weightQ4_0[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_0[28672 8192]
-
blk.16.ffn_up.weightQ4_0[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_0[28672 8192]
-
blk.17.ffn_gate.weightQ4_0[8192 28672]
-
blk.17.ffn_up.weightQ4_0[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ4_0[8192 1024]
-
blk.17.attn_output.weightQ4_0[8192 8192]
-
blk.17.attn_q.weightQ4_0[8192 8192]
-
blk.17.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_0[28672 8192]
-
blk.18.ffn_gate.weightQ4_0[8192 28672]
-
blk.18.ffn_up.weightQ4_0[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.weightQ4_0[8192 1024]
-
blk.18.attn_output.weightQ4_0[8192 8192]
-
blk.18.attn_q.weightQ4_0[8192 8192]
-
blk.18.attn_v.weightQ4_0[8192 1024]
-
blk.19.attn_k.weightQ4_0[8192 1024]
-
blk.19.attn_output.weightQ4_0[8192 8192]
-
blk.19.attn_q.weightQ4_0[8192 8192]
-
blk.19.attn_v.weightQ4_0[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_0[28672 8192]
-
blk.19.ffn_gate.weightQ4_0[8192 28672]
-
blk.19.ffn_up.weightQ4_0[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_0[28672 8192]
-
blk.20.ffn_gate.weightQ4_0[8192 28672]
-
blk.20.ffn_up.weightQ4_0[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ4_0[8192 1024]
-
blk.20.attn_output.weightQ4_0[8192 8192]
-
blk.20.attn_q.weightQ4_0[8192 8192]
-
blk.20.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_0[28672 8192]
-
blk.21.ffn_gate.weightQ4_0[8192 28672]
-
blk.21.ffn_up.weightQ4_0[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.weightQ4_0[8192 1024]
-
blk.21.attn_output.weightQ4_0[8192 8192]
-
blk.21.attn_q.weightQ4_0[8192 8192]
-
blk.21.attn_v.weightQ4_0[8192 1024]
-
blk.22.attn_k.weightQ4_0[8192 1024]
-
blk.22.attn_q.weightQ4_0[8192 8192]
-
blk.22.attn_v.weightQ4_0[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_0[28672 8192]
-
blk.22.ffn_gate.weightQ4_0[8192 28672]
-
blk.22.ffn_up.weightQ4_0[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_0[28672 8192]
-
blk.23.ffn_gate.weightQ4_0[8192 28672]
-
blk.23.ffn_up.weightQ4_0[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_0[8192 1024]
-
blk.23.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_q.weightQ4_0[8192 8192]
-
blk.23.attn_v.weightQ4_0[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_0[28672 8192]
-
blk.24.ffn_gate.weightQ4_0[8192 28672]
-
blk.24.ffn_up.weightQ4_0[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ4_0[8192 1024]
-
blk.24.attn_output.weightQ4_0[8192 8192]
-
blk.24.attn_q.weightQ4_0[8192 8192]
-
blk.24.attn_v.weightQ4_0[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_0[28672 8192]
-
blk.25.ffn_gate.weightQ4_0[8192 28672]
-
blk.25.ffn_up.weightQ4_0[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ4_0[8192 1024]
-
blk.25.attn_output.weightQ4_0[8192 8192]
-
blk.25.attn_q.weightQ4_0[8192 8192]
-
blk.25.attn_v.weightQ4_0[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_0[28672 8192]
-
blk.26.ffn_gate.weightQ4_0[8192 28672]
-
blk.26.ffn_up.weightQ4_0[8192 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ4_0[8192 1024]
-
blk.26.attn_output.weightQ4_0[8192 8192]
-
blk.26.attn_q.weightQ4_0[8192 8192]
-
blk.26.attn_v.weightQ4_0[8192 1024]
-
blk.27.ffn_gate.weightQ4_0[8192 28672]
-
blk.27.ffn_up.weightQ4_0[8192 28672]
-
blk.27.attn_k.weightQ4_0[8192 1024]
-
blk.27.attn_output.weightQ4_0[8192 8192]
-
blk.27.attn_q.weightQ4_0[8192 8192]
-
blk.27.attn_v.weightQ4_0[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_0[28672 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_0[28672 8192]
-
blk.28.ffn_gate.weightQ4_0[8192 28672]
-
blk.28.ffn_up.weightQ4_0[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_0[8192 1024]
-
blk.28.attn_output.weightQ4_0[8192 8192]
-
blk.28.attn_q.weightQ4_0[8192 8192]
-
blk.28.attn_v.weightQ4_0[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_0[28672 8192]
-
blk.29.ffn_gate.weightQ4_0[8192 28672]
-
blk.29.ffn_up.weightQ4_0[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ4_0[8192 1024]
-
blk.29.attn_output.weightQ4_0[8192 8192]
-
blk.29.attn_q.weightQ4_0[8192 8192]
-
blk.29.attn_v.weightQ4_0[8192 1024]
-
blk.30.ffn_gate.weightQ4_0[8192 28672]
-
blk.30.attn_k.weightQ4_0[8192 1024]
-
blk.30.attn_output.weightQ4_0[8192 8192]
-
blk.30.attn_q.weightQ4_0[8192 8192]
-
blk.30.attn_v.weightQ4_0[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_0[28672 8192]
-
blk.30.ffn_up.weightQ4_0[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_0[28672 8192]
-
blk.31.ffn_gate.weightQ4_0[8192 28672]
-
blk.31.ffn_up.weightQ4_0[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ4_0[8192 1024]
-
blk.31.attn_output.weightQ4_0[8192 8192]
-
blk.31.attn_q.weightQ4_0[8192 8192]
-
blk.31.attn_v.weightQ4_0[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_0[28672 8192]
-
blk.32.ffn_gate.weightQ4_0[8192 28672]
-
blk.32.ffn_up.weightQ4_0[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ4_0[8192 1024]
-
blk.32.attn_output.weightQ4_0[8192 8192]
-
blk.32.attn_q.weightQ4_0[8192 8192]
-
blk.32.attn_v.weightQ4_0[8192 1024]
-
blk.33.attn_k.weightQ4_0[8192 1024]
-
blk.33.attn_output.weightQ4_0[8192 8192]
-
blk.33.attn_q.weightQ4_0[8192 8192]
-
blk.33.attn_v.weightQ4_0[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_0[28672 8192]
-
blk.33.ffn_gate.weightQ4_0[8192 28672]
-
blk.33.ffn_up.weightQ4_0[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_0[28672 8192]
-
blk.34.ffn_gate.weightQ4_0[8192 28672]
-
blk.34.ffn_up.weightQ4_0[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ4_0[8192 1024]
-
blk.34.attn_output.weightQ4_0[8192 8192]
-
blk.34.attn_q.weightQ4_0[8192 8192]
-
blk.34.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_0[28672 8192]
-
blk.35.ffn_gate.weightQ4_0[8192 28672]
-
blk.35.ffn_up.weightQ4_0[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ4_0[8192 1024]
-
blk.35.attn_output.weightQ4_0[8192 8192]
-
blk.35.attn_q.weightQ4_0[8192 8192]
-
blk.35.attn_v.weightQ4_0[8192 1024]
-
blk.36.attn_k.weightQ4_0[8192 1024]
-
blk.36.attn_q.weightQ4_0[8192 8192]
-
blk.36.attn_v.weightQ4_0[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_0[28672 8192]
-
blk.36.ffn_gate.weightQ4_0[8192 28672]
-
blk.36.ffn_up.weightQ4_0[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_0[28672 8192]
-
blk.37.ffn_gate.weightQ4_0[8192 28672]
-
blk.37.ffn_up.weightQ4_0[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ4_0[8192 1024]
-
blk.37.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_q.weightQ4_0[8192 8192]
-
blk.37.attn_v.weightQ4_0[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_0[28672 8192]
-
blk.38.ffn_gate.weightQ4_0[8192 28672]
-
blk.38.ffn_up.weightQ4_0[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ4_0[8192 1024]
-
blk.38.attn_output.weightQ4_0[8192 8192]
-
blk.38.attn_q.weightQ4_0[8192 8192]
-
blk.38.attn_v.weightQ4_0[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_0[28672 8192]
-
blk.39.ffn_gate.weightQ4_0[8192 28672]
-
blk.39.ffn_up.weightQ4_0[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_0[8192 1024]
-
blk.39.attn_output.weightQ4_0[8192 8192]
-
blk.39.attn_q.weightQ4_0[8192 8192]
-
blk.39.attn_v.weightQ4_0[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_0[28672 8192]
-
blk.40.ffn_gate.weightQ4_0[8192 28672]
-
blk.40.ffn_up.weightQ4_0[8192 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ4_0[8192 1024]
-
blk.40.attn_output.weightQ4_0[8192 8192]
-
blk.40.attn_q.weightQ4_0[8192 8192]
-
blk.40.attn_v.weightQ4_0[8192 1024]
-
blk.41.ffn_gate.weightQ4_0[8192 28672]
-
blk.41.ffn_up.weightQ4_0[8192 28672]
-
blk.41.attn_k.weightQ4_0[8192 1024]
-
blk.41.attn_output.weightQ4_0[8192 8192]
-
blk.41.attn_q.weightQ4_0[8192 8192]
-
blk.41.attn_v.weightQ4_0[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_0[28672 8192]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_0[28672 8192]
-
blk.42.ffn_gate.weightQ4_0[8192 28672]
-
blk.42.ffn_up.weightQ4_0[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ4_0[8192 1024]
-
blk.42.attn_output.weightQ4_0[8192 8192]
-
blk.42.attn_q.weightQ4_0[8192 8192]
-
blk.42.attn_v.weightQ4_0[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_0[28672 8192]
-
blk.43.ffn_gate.weightQ4_0[8192 28672]
-
blk.43.ffn_up.weightQ4_0[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ4_0[8192 1024]
-
blk.43.attn_output.weightQ4_0[8192 8192]
-
blk.43.attn_q.weightQ4_0[8192 8192]
-
blk.43.attn_v.weightQ4_0[8192 1024]
-
blk.44.ffn_gate.weightQ4_0[8192 28672]
-
blk.44.attn_k.weightQ4_0[8192 1024]
-
blk.44.attn_output.weightQ4_0[8192 8192]
-
blk.44.attn_q.weightQ4_0[8192 8192]
-
blk.44.attn_v.weightQ4_0[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_0[28672 8192]
-
blk.44.ffn_up.weightQ4_0[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_0[28672 8192]
-
blk.45.ffn_gate.weightQ4_0[8192 28672]
-
blk.45.ffn_up.weightQ4_0[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ4_0[8192 1024]
-
blk.45.attn_output.weightQ4_0[8192 8192]
-
blk.45.attn_q.weightQ4_0[8192 8192]
-
blk.45.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_0[28672 8192]
-
blk.46.ffn_gate.weightQ4_0[8192 28672]
-
blk.46.ffn_up.weightQ4_0[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ4_0[8192 1024]
-
blk.46.attn_output.weightQ4_0[8192 8192]
-
blk.46.attn_q.weightQ4_0[8192 8192]
-
blk.46.attn_v.weightQ4_0[8192 1024]
-
blk.47.attn_k.weightQ4_0[8192 1024]
-
blk.47.attn_output.weightQ4_0[8192 8192]
-
blk.47.attn_q.weightQ4_0[8192 8192]
-
blk.47.attn_v.weightQ4_0[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_0[28672 8192]
-
blk.47.ffn_gate.weightQ4_0[8192 28672]
-
blk.47.ffn_up.weightQ4_0[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ4_0[28672 8192]
-
blk.48.ffn_gate.weightQ4_0[8192 28672]
-
blk.48.ffn_up.weightQ4_0[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightQ4_0[8192 1024]
-
blk.48.attn_output.weightQ4_0[8192 8192]
-
blk.48.attn_q.weightQ4_0[8192 8192]
-
blk.48.attn_v.weightQ4_0[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ4_0[28672 8192]
-
blk.49.ffn_gate.weightQ4_0[8192 28672]
-
blk.49.ffn_up.weightQ4_0[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.weightQ4_0[8192 1024]
-
blk.49.attn_output.weightQ4_0[8192 8192]
-
blk.49.attn_q.weightQ4_0[8192 8192]
-
blk.49.attn_v.weightQ4_0[8192 1024]
-
blk.50.attn_k.weightQ4_0[8192 1024]
-
blk.50.attn_q.weightQ4_0[8192 8192]
-
blk.50.attn_v.weightQ4_0[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightQ4_0[28672 8192]
-
blk.50.ffn_gate.weightQ4_0[8192 28672]
-
blk.50.ffn_up.weightQ4_0[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_output.weightQ4_0[8192 8192]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ4_0[28672 8192]
-
blk.51.ffn_gate.weightQ4_0[8192 28672]
-
blk.51.ffn_up.weightQ4_0[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightQ4_0[8192 1024]
-
blk.51.attn_output.weightQ4_0[8192 8192]
-
blk.51.attn_q.weightQ4_0[8192 8192]
-
blk.51.attn_v.weightQ4_0[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ4_0[28672 8192]
-
blk.52.ffn_gate.weightQ4_0[8192 28672]
-
blk.52.ffn_up.weightQ4_0[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightQ4_0[8192 1024]
-
blk.52.attn_output.weightQ4_0[8192 8192]
-
blk.52.attn_q.weightQ4_0[8192 8192]
-
blk.52.attn_v.weightQ4_0[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightQ4_0[28672 8192]
-
blk.53.ffn_gate.weightQ4_0[8192 28672]
-
blk.53.ffn_up.weightQ4_0[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightQ4_0[8192 1024]
-
blk.53.attn_output.weightQ4_0[8192 8192]
-
blk.53.attn_q.weightQ4_0[8192 8192]
-
blk.53.attn_v.weightQ4_0[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ4_0[28672 8192]
-
blk.54.ffn_gate.weightQ4_0[8192 28672]
-
blk.54.ffn_up.weightQ4_0[8192 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.weightQ4_0[8192 1024]
-
blk.54.attn_output.weightQ4_0[8192 8192]
-
blk.54.attn_q.weightQ4_0[8192 8192]
-
blk.54.attn_v.weightQ4_0[8192 1024]
-
blk.55.ffn_gate.weightQ4_0[8192 28672]
-
blk.55.ffn_up.weightQ4_0[8192 28672]
-
blk.55.attn_k.weightQ4_0[8192 1024]
-
blk.55.attn_output.weightQ4_0[8192 8192]
-
blk.55.attn_q.weightQ4_0[8192 8192]
-
blk.55.attn_v.weightQ4_0[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ4_0[28672 8192]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightQ4_0[28672 8192]
-
blk.56.ffn_gate.weightQ4_0[8192 28672]
-
blk.56.ffn_up.weightQ4_0[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightQ4_0[8192 1024]
-
blk.56.attn_output.weightQ4_0[8192 8192]
-
blk.56.attn_q.weightQ4_0[8192 8192]
-
blk.56.attn_v.weightQ4_0[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightQ4_0[28672 8192]
-
blk.57.ffn_gate.weightQ4_0[8192 28672]
-
blk.57.ffn_up.weightQ4_0[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.weightQ4_0[8192 1024]
-
blk.57.attn_output.weightQ4_0[8192 8192]
-
blk.57.attn_q.weightQ4_0[8192 8192]
-
blk.57.attn_v.weightQ4_0[8192 1024]
-
blk.58.ffn_gate.weightQ4_0[8192 28672]
-
blk.58.attn_k.weightQ4_0[8192 1024]
-
blk.58.attn_output.weightQ4_0[8192 8192]
-
blk.58.attn_q.weightQ4_0[8192 8192]
-
blk.58.attn_v.weightQ4_0[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ4_0[28672 8192]
-
blk.58.ffn_up.weightQ4_0[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightQ4_0[28672 8192]
-
blk.59.ffn_gate.weightQ4_0[8192 28672]
-
blk.59.ffn_up.weightQ4_0[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightQ4_0[8192 1024]
-
blk.59.attn_output.weightQ4_0[8192 8192]
-
blk.59.attn_q.weightQ4_0[8192 8192]
-
blk.59.attn_v.weightQ4_0[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ4_0[28672 8192]
-
blk.60.ffn_gate.weightQ4_0[8192 28672]
-
blk.60.ffn_up.weightQ4_0[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.weightQ4_0[8192 1024]
-
blk.60.attn_output.weightQ4_0[8192 8192]
-
blk.60.attn_q.weightQ4_0[8192 8192]
-
blk.60.attn_v.weightQ4_0[8192 1024]
-
blk.61.attn_k.weightQ4_0[8192 1024]
-
blk.61.attn_output.weightQ4_0[8192 8192]
-
blk.61.attn_q.weightQ4_0[8192 8192]
-
blk.61.attn_v.weightQ4_0[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ4_0[28672 8192]
-
blk.61.ffn_gate.weightQ4_0[8192 28672]
-
blk.61.ffn_up.weightQ4_0[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ4_0[28672 8192]
-
blk.62.ffn_gate.weightQ4_0[8192 28672]
-
blk.62.ffn_up.weightQ4_0[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightQ4_0[8192 1024]
-
blk.62.attn_output.weightQ4_0[8192 8192]
-
blk.62.attn_q.weightQ4_0[8192 8192]
-
blk.62.attn_v.weightQ4_0[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ4_0[28672 8192]
-
blk.63.ffn_gate.weightQ4_0[8192 28672]
-
blk.63.ffn_up.weightQ4_0[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.weightQ4_0[8192 1024]
-
blk.63.attn_output.weightQ4_0[8192 8192]
-
blk.63.attn_q.weightQ4_0[8192 8192]
-
blk.63.attn_v.weightQ4_0[8192 1024]
-
blk.64.attn_k.weightQ4_0[8192 1024]
-
blk.64.attn_q.weightQ4_0[8192 8192]
-
blk.64.attn_v.weightQ4_0[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ4_0[28672 8192]
-
blk.64.ffn_gate.weightQ4_0[8192 28672]
-
blk.64.ffn_up.weightQ4_0[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_output.weightQ4_0[8192 8192]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ4_0[28672 8192]
-
blk.65.ffn_gate.weightQ4_0[8192 28672]
-
blk.65.ffn_up.weightQ4_0[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightQ4_0[8192 1024]
-
blk.65.attn_output.weightQ4_0[8192 8192]
-
blk.65.attn_q.weightQ4_0[8192 8192]
-
blk.65.attn_v.weightQ4_0[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ4_0[28672 8192]
-
blk.66.ffn_gate.weightQ4_0[8192 28672]
-
blk.66.ffn_up.weightQ4_0[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightQ4_0[8192 1024]
-
blk.66.attn_output.weightQ4_0[8192 8192]
-
blk.66.attn_q.weightQ4_0[8192 8192]
-
blk.66.attn_v.weightQ4_0[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ4_0[28672 8192]
-
blk.67.ffn_gate.weightQ4_0[8192 28672]
-
blk.67.ffn_up.weightQ4_0[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightQ4_0[8192 1024]
-
blk.67.attn_output.weightQ4_0[8192 8192]
-
blk.67.attn_q.weightQ4_0[8192 8192]
-
blk.67.attn_v.weightQ4_0[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightQ4_0[28672 8192]
-
blk.68.ffn_gate.weightQ4_0[8192 28672]
-
blk.68.ffn_up.weightQ4_0[8192 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.weightQ4_0[8192 1024]
-
blk.68.attn_output.weightQ4_0[8192 8192]
-
blk.68.attn_q.weightQ4_0[8192 8192]
-
blk.68.attn_v.weightQ4_0[8192 1024]
-
blk.69.ffn_gate.weightQ4_0[8192 28672]
-
blk.69.ffn_up.weightQ4_0[8192 28672]
-
blk.69.attn_k.weightQ4_0[8192 1024]
-
blk.69.attn_output.weightQ4_0[8192 8192]
-
blk.69.attn_q.weightQ4_0[8192 8192]
-
blk.69.attn_v.weightQ4_0[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ4_0[28672 8192]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ4_0[28672 8192]
-
blk.70.ffn_gate.weightQ4_0[8192 28672]
-
blk.70.ffn_up.weightQ4_0[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightQ4_0[8192 1024]
-
blk.70.attn_output.weightQ4_0[8192 8192]
-
blk.70.attn_q.weightQ4_0[8192 8192]
-
blk.70.attn_v.weightQ4_0[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ4_0[28672 8192]
-
blk.71.ffn_gate.weightQ4_0[8192 28672]
-
blk.71.ffn_up.weightQ4_0[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.weightQ4_0[8192 1024]
-
blk.71.attn_output.weightQ4_0[8192 8192]
-
blk.71.attn_q.weightQ4_0[8192 8192]
-
blk.71.attn_v.weightQ4_0[8192 1024]
-
blk.72.ffn_gate.weightQ4_0[8192 28672]
-
blk.72.attn_k.weightQ4_0[8192 1024]
-
blk.72.attn_output.weightQ4_0[8192 8192]
-
blk.72.attn_q.weightQ4_0[8192 8192]
-
blk.72.attn_v.weightQ4_0[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ4_0[28672 8192]
-
blk.72.ffn_up.weightQ4_0[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ4_0[28672 8192]
-
blk.73.ffn_gate.weightQ4_0[8192 28672]
-
blk.73.ffn_up.weightQ4_0[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightQ4_0[8192 1024]
-
blk.73.attn_output.weightQ4_0[8192 8192]
-
blk.73.attn_q.weightQ4_0[8192 8192]
-
blk.73.attn_v.weightQ4_0[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ4_0[28672 8192]
-
blk.74.ffn_gate.weightQ4_0[8192 28672]
-
blk.74.ffn_up.weightQ4_0[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.weightQ4_0[8192 1024]
-
blk.74.attn_output.weightQ4_0[8192 8192]
-
blk.74.attn_q.weightQ4_0[8192 8192]
-
blk.74.attn_v.weightQ4_0[8192 1024]
-
blk.75.attn_k.weightQ4_0[8192 1024]
-
blk.75.attn_output.weightQ4_0[8192 8192]
-
blk.75.attn_q.weightQ4_0[8192 8192]
-
blk.75.attn_v.weightQ4_0[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ4_0[28672 8192]
-
blk.75.ffn_gate.weightQ4_0[8192 28672]
-
blk.75.ffn_up.weightQ4_0[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ4_0[28672 8192]
-
blk.76.ffn_gate.weightQ4_0[8192 28672]
-
blk.76.ffn_up.weightQ4_0[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightQ4_0[8192 1024]
-
blk.76.attn_output.weightQ4_0[8192 8192]
-
blk.76.attn_q.weightQ4_0[8192 8192]
-
blk.76.attn_v.weightQ4_0[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ4_0[28672 8192]
-
blk.77.ffn_gate.weightQ4_0[8192 28672]
-
blk.77.ffn_up.weightQ4_0[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.weightQ4_0[8192 1024]
-
blk.77.attn_output.weightQ4_0[8192 8192]
-
blk.77.attn_q.weightQ4_0[8192 8192]
-
blk.77.attn_v.weightQ4_0[8192 1024]
-
blk.78.attn_k.weightQ4_0[8192 1024]
-
blk.78.attn_q.weightQ4_0[8192 8192]
-
blk.78.attn_v.weightQ4_0[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightQ4_0[28672 8192]
-
blk.78.ffn_gate.weightQ4_0[8192 28672]
-
blk.78.ffn_up.weightQ4_0[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_output.weightQ4_0[8192 8192]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ4_0[28672 8192]
-
blk.79.ffn_gate.weightQ4_0[8192 28672]
-
blk.79.ffn_up.weightQ4_0[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightQ4_0[8192 1024]
-
blk.79.attn_output.weightQ4_0[8192 8192]
-
blk.79.attn_q.weightQ4_0[8192 8192]
-
blk.79.attn_v.weightQ4_0[8192 1024]
-
output.weightQ6_K[8192 32016]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79