7B
34B
87 Pulls Updated 7 months ago
b7e4fc0f8b8f · 20GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count48
-
llama.context_length16384
-
llama.embedding_length8192
-
llama.feed_forward_length22016
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[8192 32001]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ6_K[22016 8192]
-
blk.0.ffn_gate.weightQ4_K[8192 22016]
-
blk.0.ffn_up.weightQ4_K[8192 22016]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_K[8192 1024]
-
blk.0.attn_output.weightQ4_K[8192 8192]
-
blk.0.attn_q.weightQ4_K[8192 8192]
-
blk.0.attn_v.weightQ6_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ6_K[22016 8192]
-
blk.1.ffn_gate.weightQ4_K[8192 22016]
-
blk.1.ffn_up.weightQ4_K[8192 22016]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ4_K[8192 1024]
-
blk.1.attn_output.weightQ4_K[8192 8192]
-
blk.1.attn_q.weightQ4_K[8192 8192]
-
blk.1.attn_v.weightQ6_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ6_K[22016 8192]
-
blk.2.ffn_gate.weightQ4_K[8192 22016]
-
blk.2.ffn_up.weightQ4_K[8192 22016]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ4_K[8192 1024]
-
blk.2.attn_output.weightQ4_K[8192 8192]
-
blk.2.attn_q.weightQ4_K[8192 8192]
-
blk.2.attn_v.weightQ6_K[8192 1024]
-
blk.3.attn_k.weightQ4_K[8192 1024]
-
blk.3.attn_output.weightQ4_K[8192 8192]
-
blk.3.attn_q.weightQ4_K[8192 8192]
-
blk.3.attn_v.weightQ6_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ6_K[22016 8192]
-
blk.3.ffn_gate.weightQ4_K[8192 22016]
-
blk.3.ffn_up.weightQ4_K[8192 22016]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ6_K[22016 8192]
-
blk.4.ffn_gate.weightQ4_K[8192 22016]
-
blk.4.ffn_up.weightQ4_K[8192 22016]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ4_K[8192 1024]
-
blk.4.attn_output.weightQ4_K[8192 8192]
-
blk.4.attn_q.weightQ4_K[8192 8192]
-
blk.4.attn_v.weightQ6_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ6_K[22016 8192]
-
blk.5.ffn_gate.weightQ4_K[8192 22016]
-
blk.5.ffn_up.weightQ4_K[8192 22016]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.weightQ4_K[8192 1024]
-
blk.5.attn_output.weightQ4_K[8192 8192]
-
blk.5.attn_q.weightQ4_K[8192 8192]
-
blk.5.attn_v.weightQ6_K[8192 1024]
-
blk.6.ffn_gate.weightQ4_K[8192 22016]
-
blk.6.ffn_up.weightQ4_K[8192 22016]
-
blk.6.attn_k.weightQ4_K[8192 1024]
-
blk.6.attn_output.weightQ4_K[8192 8192]
-
blk.6.attn_q.weightQ4_K[8192 8192]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_K[22016 8192]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_K[22016 8192]
-
blk.7.ffn_gate.weightQ4_K[8192 22016]
-
blk.7.ffn_up.weightQ4_K[8192 22016]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ4_K[8192 1024]
-
blk.7.attn_output.weightQ4_K[8192 8192]
-
blk.7.attn_q.weightQ4_K[8192 8192]
-
blk.7.attn_v.weightQ6_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ6_K[22016 8192]
-
blk.8.ffn_gate.weightQ4_K[8192 22016]
-
blk.8.ffn_up.weightQ4_K[8192 22016]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightQ4_K[8192 1024]
-
blk.8.attn_output.weightQ4_K[8192 8192]
-
blk.8.attn_q.weightQ4_K[8192 8192]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_K[22016 8192]
-
blk.9.ffn_gate.weightQ4_K[8192 22016]
-
blk.9.ffn_up.weightQ4_K[8192 22016]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_K[8192 1024]
-
blk.9.attn_output.weightQ4_K[8192 8192]
-
blk.9.attn_q.weightQ4_K[8192 8192]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_k.weightQ4_K[8192 1024]
-
blk.10.attn_output.weightQ4_K[8192 8192]
-
blk.10.attn_q.weightQ4_K[8192 8192]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_K[22016 8192]
-
blk.10.ffn_gate.weightQ4_K[8192 22016]
-
blk.10.ffn_up.weightQ4_K[8192 22016]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ6_K[22016 8192]
-
blk.11.ffn_gate.weightQ4_K[8192 22016]
-
blk.11.ffn_up.weightQ4_K[8192 22016]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ4_K[8192 1024]
-
blk.11.attn_output.weightQ4_K[8192 8192]
-
blk.11.attn_q.weightQ4_K[8192 8192]
-
blk.11.attn_v.weightQ6_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_K[22016 8192]
-
blk.12.ffn_gate.weightQ4_K[8192 22016]
-
blk.12.ffn_up.weightQ4_K[8192 22016]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.weightQ4_K[8192 1024]
-
blk.12.attn_output.weightQ4_K[8192 8192]
-
blk.12.attn_q.weightQ4_K[8192 8192]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.13.ffn_gate.weightQ4_K[8192 22016]
-
blk.13.ffn_up.weightQ4_K[8192 22016]
-
blk.13.attn_k.weightQ4_K[8192 1024]
-
blk.13.attn_output.weightQ4_K[8192 8192]
-
blk.13.attn_q.weightQ4_K[8192 8192]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_K[22016 8192]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ6_K[22016 8192]
-
blk.14.ffn_gate.weightQ4_K[8192 22016]
-
blk.14.ffn_up.weightQ4_K[8192 22016]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_K[8192 1024]
-
blk.14.attn_output.weightQ4_K[8192 8192]
-
blk.14.attn_q.weightQ4_K[8192 8192]
-
blk.14.attn_v.weightQ6_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_K[22016 8192]
-
blk.15.ffn_gate.weightQ4_K[8192 22016]
-
blk.15.ffn_up.weightQ4_K[8192 22016]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ4_K[8192 1024]
-
blk.15.attn_output.weightQ4_K[8192 8192]
-
blk.15.attn_q.weightQ4_K[8192 8192]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_K[22016 8192]
-
blk.16.ffn_gate.weightQ4_K[8192 22016]
-
blk.16.ffn_up.weightQ4_K[8192 22016]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightQ4_K[8192 1024]
-
blk.16.attn_output.weightQ4_K[8192 8192]
-
blk.16.attn_q.weightQ4_K[8192 8192]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_k.weightQ4_K[8192 1024]
-
blk.17.attn_output.weightQ4_K[8192 8192]
-
blk.17.attn_q.weightQ4_K[8192 8192]
-
blk.17.attn_v.weightQ6_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ6_K[22016 8192]
-
blk.17.ffn_gate.weightQ4_K[8192 22016]
-
blk.17.ffn_up.weightQ4_K[8192 22016]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_K[22016 8192]
-
blk.18.ffn_gate.weightQ4_K[8192 22016]
-
blk.18.ffn_up.weightQ4_K[8192 22016]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.weightQ4_K[8192 1024]
-
blk.18.attn_output.weightQ4_K[8192 8192]
-
blk.18.attn_q.weightQ4_K[8192 8192]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_K[22016 8192]
-
blk.19.ffn_gate.weightQ4_K[8192 22016]
-
blk.19.ffn_up.weightQ4_K[8192 22016]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightQ4_K[8192 1024]
-
blk.19.attn_output.weightQ4_K[8192 8192]
-
blk.19.attn_q.weightQ4_K[8192 8192]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.20.ffn_gate.weightQ4_K[8192 22016]
-
blk.20.ffn_up.weightQ4_K[8192 22016]
-
blk.20.attn_k.weightQ4_K[8192 1024]
-
blk.20.attn_output.weightQ4_K[8192 8192]
-
blk.20.attn_q.weightQ4_K[8192 8192]
-
blk.20.attn_v.weightQ6_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ6_K[22016 8192]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_K[22016 8192]
-
blk.21.ffn_gate.weightQ4_K[8192 22016]
-
blk.21.ffn_up.weightQ4_K[8192 22016]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.weightQ4_K[8192 1024]
-
blk.21.attn_output.weightQ4_K[8192 8192]
-
blk.21.attn_q.weightQ4_K[8192 8192]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_K[22016 8192]
-
blk.22.ffn_gate.weightQ4_K[8192 22016]
-
blk.22.ffn_up.weightQ4_K[8192 22016]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightQ4_K[8192 1024]
-
blk.22.attn_output.weightQ4_K[8192 8192]
-
blk.22.attn_q.weightQ4_K[8192 8192]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ6_K[22016 8192]
-
blk.23.ffn_gate.weightQ4_K[8192 22016]
-
blk.23.ffn_up.weightQ4_K[8192 22016]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_K[8192 1024]
-
blk.23.attn_output.weightQ4_K[8192 8192]
-
blk.23.attn_q.weightQ4_K[8192 8192]
-
blk.23.attn_v.weightQ6_K[8192 1024]
-
blk.24.attn_k.weightQ4_K[8192 1024]
-
blk.24.attn_output.weightQ4_K[8192 8192]
-
blk.24.attn_q.weightQ4_K[8192 8192]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_K[22016 8192]
-
blk.24.ffn_gate.weightQ4_K[8192 22016]
-
blk.24.ffn_up.weightQ4_K[8192 22016]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_K[22016 8192]
-
blk.25.ffn_gate.weightQ4_K[8192 22016]
-
blk.25.ffn_up.weightQ4_K[8192 22016]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ4_K[8192 1024]
-
blk.25.attn_output.weightQ4_K[8192 8192]
-
blk.25.attn_q.weightQ4_K[8192 8192]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ6_K[22016 8192]
-
blk.26.ffn_gate.weightQ4_K[8192 22016]
-
blk.26.ffn_up.weightQ4_K[8192 22016]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ4_K[8192 1024]
-
blk.26.attn_output.weightQ4_K[8192 8192]
-
blk.26.attn_q.weightQ4_K[8192 8192]
-
blk.26.attn_v.weightQ6_K[8192 1024]
-
blk.27.ffn_gate.weightQ4_K[8192 22016]
-
blk.27.ffn_up.weightQ4_K[8192 22016]
-
blk.27.attn_k.weightQ4_K[8192 1024]
-
blk.27.attn_output.weightQ4_K[8192 8192]
-
blk.27.attn_q.weightQ4_K[8192 8192]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_K[22016 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_K[22016 8192]
-
blk.28.ffn_gate.weightQ4_K[8192 22016]
-
blk.28.ffn_up.weightQ4_K[8192 22016]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_K[8192 1024]
-
blk.28.attn_output.weightQ4_K[8192 8192]
-
blk.28.attn_q.weightQ4_K[8192 8192]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ6_K[22016 8192]
-
blk.29.ffn_gate.weightQ4_K[8192 22016]
-
blk.29.ffn_up.weightQ4_K[8192 22016]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ4_K[8192 1024]
-
blk.29.attn_output.weightQ4_K[8192 8192]
-
blk.29.attn_q.weightQ4_K[8192 8192]
-
blk.29.attn_v.weightQ6_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_K[22016 8192]
-
blk.30.ffn_gate.weightQ4_K[8192 22016]
-
blk.30.ffn_up.weightQ4_K[8192 22016]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightQ4_K[8192 1024]
-
blk.30.attn_output.weightQ4_K[8192 8192]
-
blk.30.attn_q.weightQ4_K[8192 8192]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_k.weightQ4_K[8192 1024]
-
blk.31.attn_output.weightQ4_K[8192 8192]
-
blk.31.attn_q.weightQ4_K[8192 8192]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_K[22016 8192]
-
blk.31.ffn_gate.weightQ4_K[8192 22016]
-
blk.31.ffn_up.weightQ4_K[8192 22016]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ6_K[22016 8192]
-
blk.32.ffn_gate.weightQ4_K[8192 22016]
-
blk.32.ffn_up.weightQ4_K[8192 22016]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ4_K[8192 1024]
-
blk.32.attn_output.weightQ4_K[8192 8192]
-
blk.32.attn_q.weightQ4_K[8192 8192]
-
blk.32.attn_v.weightQ6_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_K[22016 8192]
-
blk.33.ffn_gate.weightQ4_K[8192 22016]
-
blk.33.ffn_up.weightQ4_K[8192 22016]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightQ4_K[8192 1024]
-
blk.33.attn_output.weightQ4_K[8192 8192]
-
blk.33.attn_q.weightQ4_K[8192 8192]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.34.ffn_gate.weightQ4_K[8192 22016]
-
blk.34.ffn_up.weightQ4_K[8192 22016]
-
blk.34.attn_k.weightQ4_K[8192 1024]
-
blk.34.attn_output.weightQ4_K[8192 8192]
-
blk.34.attn_q.weightQ4_K[8192 8192]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_K[22016 8192]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ6_K[22016 8192]
-
blk.35.ffn_gate.weightQ4_K[8192 22016]
-
blk.35.ffn_up.weightQ4_K[8192 22016]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ4_K[8192 1024]
-
blk.35.attn_output.weightQ4_K[8192 8192]
-
blk.35.attn_q.weightQ4_K[8192 8192]
-
blk.35.attn_v.weightQ6_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_K[22016 8192]
-
blk.36.ffn_gate.weightQ4_K[8192 22016]
-
blk.36.ffn_up.weightQ4_K[8192 22016]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightQ4_K[8192 1024]
-
blk.36.attn_output.weightQ4_K[8192 8192]
-
blk.36.attn_q.weightQ4_K[8192 8192]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_K[22016 8192]
-
blk.37.ffn_gate.weightQ4_K[8192 22016]
-
blk.37.ffn_up.weightQ4_K[8192 22016]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ4_K[8192 1024]
-
blk.37.attn_output.weightQ4_K[8192 8192]
-
blk.37.attn_q.weightQ4_K[8192 8192]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_k.weightQ4_K[8192 1024]
-
blk.38.attn_output.weightQ4_K[8192 8192]
-
blk.38.attn_q.weightQ4_K[8192 8192]
-
blk.38.attn_v.weightQ6_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ6_K[22016 8192]
-
blk.38.ffn_gate.weightQ4_K[8192 22016]
-
blk.38.ffn_up.weightQ4_K[8192 22016]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_K[22016 8192]
-
blk.39.ffn_gate.weightQ4_K[8192 22016]
-
blk.39.ffn_up.weightQ4_K[8192 22016]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_K[8192 1024]
-
blk.39.attn_output.weightQ4_K[8192 8192]
-
blk.39.attn_q.weightQ4_K[8192 8192]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_K[22016 8192]
-
blk.40.ffn_gate.weightQ4_K[8192 22016]
-
blk.40.ffn_up.weightQ4_K[8192 22016]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ4_K[8192 1024]
-
blk.40.attn_output.weightQ4_K[8192 8192]
-
blk.40.attn_q.weightQ4_K[8192 8192]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.41.ffn_gate.weightQ4_K[8192 22016]
-
blk.41.ffn_up.weightQ4_K[8192 22016]
-
blk.41.attn_k.weightQ4_K[8192 1024]
-
blk.41.attn_output.weightQ4_K[8192 8192]
-
blk.41.attn_q.weightQ4_K[8192 8192]
-
blk.41.attn_v.weightQ6_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ6_K[22016 8192]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ6_K[22016 8192]
-
blk.42.ffn_gate.weightQ4_K[8192 22016]
-
blk.42.ffn_up.weightQ4_K[8192 22016]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ4_K[8192 1024]
-
blk.42.attn_output.weightQ4_K[8192 8192]
-
blk.42.attn_q.weightQ4_K[8192 8192]
-
blk.42.attn_v.weightQ6_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ6_K[22016 8192]
-
blk.43.ffn_gate.weightQ4_K[8192 22016]
-
blk.43.ffn_up.weightQ4_K[8192 22016]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ4_K[8192 1024]
-
blk.43.attn_output.weightQ4_K[8192 8192]
-
blk.43.attn_q.weightQ4_K[8192 8192]
-
blk.43.attn_v.weightQ6_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ6_K[22016 8192]
-
blk.44.ffn_gate.weightQ4_K[8192 22016]
-
blk.44.ffn_up.weightQ4_K[8192 22016]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightQ4_K[8192 1024]
-
blk.44.attn_output.weightQ4_K[8192 8192]
-
blk.44.attn_q.weightQ4_K[8192 8192]
-
blk.44.attn_v.weightQ6_K[8192 1024]
-
blk.45.attn_k.weightQ4_K[8192 1024]
-
blk.45.attn_output.weightQ4_K[8192 8192]
-
blk.45.attn_q.weightQ4_K[8192 8192]
-
blk.45.attn_v.weightQ6_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ6_K[22016 8192]
-
blk.45.ffn_gate.weightQ4_K[8192 22016]
-
blk.45.ffn_up.weightQ4_K[8192 22016]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ6_K[22016 8192]
-
blk.46.ffn_gate.weightQ4_K[8192 22016]
-
blk.46.ffn_up.weightQ4_K[8192 22016]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ4_K[8192 1024]
-
blk.46.attn_output.weightQ4_K[8192 8192]
-
blk.46.attn_q.weightQ4_K[8192 8192]
-
blk.46.attn_v.weightQ6_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ6_K[22016 8192]
-
blk.47.ffn_gate.weightQ4_K[8192 22016]
-
blk.47.ffn_up.weightQ4_K[8192 22016]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightQ4_K[8192 1024]
-
blk.47.attn_output.weightQ4_K[8192 8192]
-
blk.47.attn_q.weightQ4_K[8192 8192]
-
blk.47.attn_v.weightQ6_K[8192 1024]
-
output.weightQ6_K[8192 32001]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47