Custom Mistral Mini 22b finetuned by TheDrummer (Source: https://huggingface.co/TheDrummer/Cydonia-22B-v1.1)
Tools
22B
33 Pulls Updated 11 days ago
357ef802c976 · 18GB
-
general.architecturellama
-
general.file_typeQ6_K
-
llama.attention.head_count48
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count56
-
llama.context_length131072
-
llama.embedding_length6144
-
llama.feed_forward_length16384
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32768
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ6_K[6144 32768]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_down.weightQ6_K[16384 6144]
-
blk.0.ffn_gate.weightQ6_K[6144 16384]
-
blk.0.ffn_up.weightQ6_K[6144 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.attn_k.weightQ6_K[6144 1024]
-
blk.0.attn_output.weightQ6_K[6144 6144]
-
blk.0.attn_q.weightQ6_K[6144 6144]
-
blk.0.attn_v.weightQ6_K[6144 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_down.weightQ6_K[16384 6144]
-
blk.1.ffn_gate.weightQ6_K[6144 16384]
-
blk.1.ffn_up.weightQ6_K[6144 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.attn_k.weightQ6_K[6144 1024]
-
blk.1.attn_output.weightQ6_K[6144 6144]
-
blk.1.attn_q.weightQ6_K[6144 6144]
-
blk.1.attn_v.weightQ6_K[6144 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_down.weightQ6_K[16384 6144]
-
blk.2.ffn_gate.weightQ6_K[6144 16384]
-
blk.2.ffn_up.weightQ6_K[6144 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.attn_k.weightQ6_K[6144 1024]
-
blk.2.attn_output.weightQ6_K[6144 6144]
-
blk.2.attn_q.weightQ6_K[6144 6144]
-
blk.2.attn_v.weightQ6_K[6144 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_down.weightQ6_K[16384 6144]
-
blk.3.ffn_gate.weightQ6_K[6144 16384]
-
blk.3.ffn_up.weightQ6_K[6144 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.attn_k.weightQ6_K[6144 1024]
-
blk.3.attn_output.weightQ6_K[6144 6144]
-
blk.3.attn_q.weightQ6_K[6144 6144]
-
blk.3.attn_v.weightQ6_K[6144 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_down.weightQ6_K[16384 6144]
-
blk.4.ffn_gate.weightQ6_K[6144 16384]
-
blk.4.ffn_up.weightQ6_K[6144 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.attn_k.weightQ6_K[6144 1024]
-
blk.4.attn_output.weightQ6_K[6144 6144]
-
blk.4.attn_q.weightQ6_K[6144 6144]
-
blk.4.attn_v.weightQ6_K[6144 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_down.weightQ6_K[16384 6144]
-
blk.5.ffn_gate.weightQ6_K[6144 16384]
-
blk.5.ffn_up.weightQ6_K[6144 16384]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.5.attn_k.weightQ6_K[6144 1024]
-
blk.5.attn_output.weightQ6_K[6144 6144]
-
blk.5.attn_q.weightQ6_K[6144 6144]
-
blk.5.attn_v.weightQ6_K[6144 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_down.weightQ6_K[16384 6144]
-
blk.6.ffn_gate.weightQ6_K[6144 16384]
-
blk.6.ffn_up.weightQ6_K[6144 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.attn_k.weightQ6_K[6144 1024]
-
blk.6.attn_output.weightQ6_K[6144 6144]
-
blk.6.attn_q.weightQ6_K[6144 6144]
-
blk.6.attn_v.weightQ6_K[6144 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_down.weightQ6_K[16384 6144]
-
blk.7.ffn_gate.weightQ6_K[6144 16384]
-
blk.7.ffn_up.weightQ6_K[6144 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.attn_k.weightQ6_K[6144 1024]
-
blk.7.attn_output.weightQ6_K[6144 6144]
-
blk.7.attn_q.weightQ6_K[6144 6144]
-
blk.7.attn_v.weightQ6_K[6144 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_down.weightQ6_K[16384 6144]
-
blk.8.ffn_gate.weightQ6_K[6144 16384]
-
blk.8.ffn_up.weightQ6_K[6144 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.attn_k.weightQ6_K[6144 1024]
-
blk.8.attn_output.weightQ6_K[6144 6144]
-
blk.8.attn_q.weightQ6_K[6144 6144]
-
blk.8.attn_v.weightQ6_K[6144 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_down.weightQ6_K[16384 6144]
-
blk.9.ffn_gate.weightQ6_K[6144 16384]
-
blk.9.ffn_up.weightQ6_K[6144 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.attn_k.weightQ6_K[6144 1024]
-
blk.9.attn_output.weightQ6_K[6144 6144]
-
blk.9.attn_q.weightQ6_K[6144 6144]
-
blk.9.attn_v.weightQ6_K[6144 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_down.weightQ6_K[16384 6144]
-
blk.10.ffn_gate.weightQ6_K[6144 16384]
-
blk.10.ffn_up.weightQ6_K[6144 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.attn_k.weightQ6_K[6144 1024]
-
blk.10.attn_output.weightQ6_K[6144 6144]
-
blk.10.attn_q.weightQ6_K[6144 6144]
-
blk.10.attn_v.weightQ6_K[6144 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_down.weightQ6_K[16384 6144]
-
blk.11.ffn_gate.weightQ6_K[6144 16384]
-
blk.11.ffn_up.weightQ6_K[6144 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.attn_k.weightQ6_K[6144 1024]
-
blk.11.attn_output.weightQ6_K[6144 6144]
-
blk.11.attn_q.weightQ6_K[6144 6144]
-
blk.11.attn_v.weightQ6_K[6144 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_down.weightQ6_K[16384 6144]
-
blk.12.ffn_gate.weightQ6_K[6144 16384]
-
blk.12.ffn_up.weightQ6_K[6144 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.attn_k.weightQ6_K[6144 1024]
-
blk.12.attn_output.weightQ6_K[6144 6144]
-
blk.12.attn_q.weightQ6_K[6144 6144]
-
blk.12.attn_v.weightQ6_K[6144 1024]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_down.weightQ6_K[16384 6144]
-
blk.13.ffn_gate.weightQ6_K[6144 16384]
-
blk.13.ffn_up.weightQ6_K[6144 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.attn_k.weightQ6_K[6144 1024]
-
blk.13.attn_output.weightQ6_K[6144 6144]
-
blk.13.attn_q.weightQ6_K[6144 6144]
-
blk.13.attn_v.weightQ6_K[6144 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_down.weightQ6_K[16384 6144]
-
blk.14.ffn_gate.weightQ6_K[6144 16384]
-
blk.14.ffn_up.weightQ6_K[6144 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.attn_k.weightQ6_K[6144 1024]
-
blk.14.attn_output.weightQ6_K[6144 6144]
-
blk.14.attn_q.weightQ6_K[6144 6144]
-
blk.14.attn_v.weightQ6_K[6144 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_down.weightQ6_K[16384 6144]
-
blk.15.ffn_gate.weightQ6_K[6144 16384]
-
blk.15.ffn_up.weightQ6_K[6144 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.attn_k.weightQ6_K[6144 1024]
-
blk.15.attn_output.weightQ6_K[6144 6144]
-
blk.15.attn_q.weightQ6_K[6144 6144]
-
blk.15.attn_v.weightQ6_K[6144 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_down.weightQ6_K[16384 6144]
-
blk.16.ffn_gate.weightQ6_K[6144 16384]
-
blk.16.ffn_up.weightQ6_K[6144 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.attn_k.weightQ6_K[6144 1024]
-
blk.16.attn_output.weightQ6_K[6144 6144]
-
blk.16.attn_q.weightQ6_K[6144 6144]
-
blk.16.attn_v.weightQ6_K[6144 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_down.weightQ6_K[16384 6144]
-
blk.17.ffn_gate.weightQ6_K[6144 16384]
-
blk.17.ffn_up.weightQ6_K[6144 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.attn_k.weightQ6_K[6144 1024]
-
blk.17.attn_output.weightQ6_K[6144 6144]
-
blk.17.attn_q.weightQ6_K[6144 6144]
-
blk.17.attn_v.weightQ6_K[6144 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_down.weightQ6_K[16384 6144]
-
blk.18.ffn_gate.weightQ6_K[6144 16384]
-
blk.18.ffn_up.weightQ6_K[6144 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.18.attn_k.weightQ6_K[6144 1024]
-
blk.18.attn_output.weightQ6_K[6144 6144]
-
blk.18.attn_q.weightQ6_K[6144 6144]
-
blk.18.attn_v.weightQ6_K[6144 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_down.weightQ6_K[16384 6144]
-
blk.19.ffn_gate.weightQ6_K[6144 16384]
-
blk.19.ffn_up.weightQ6_K[6144 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.attn_k.weightQ6_K[6144 1024]
-
blk.19.attn_output.weightQ6_K[6144 6144]
-
blk.19.attn_q.weightQ6_K[6144 6144]
-
blk.19.attn_v.weightQ6_K[6144 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_down.weightQ6_K[16384 6144]
-
blk.20.ffn_gate.weightQ6_K[6144 16384]
-
blk.20.ffn_up.weightQ6_K[6144 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.attn_k.weightQ6_K[6144 1024]
-
blk.20.attn_output.weightQ6_K[6144 6144]
-
blk.20.attn_q.weightQ6_K[6144 6144]
-
blk.20.attn_v.weightQ6_K[6144 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_down.weightQ6_K[16384 6144]
-
blk.21.ffn_gate.weightQ6_K[6144 16384]
-
blk.21.ffn_up.weightQ6_K[6144 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.attn_k.weightQ6_K[6144 1024]
-
blk.21.attn_output.weightQ6_K[6144 6144]
-
blk.21.attn_q.weightQ6_K[6144 6144]
-
blk.21.attn_v.weightQ6_K[6144 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_down.weightQ6_K[16384 6144]
-
blk.22.ffn_gate.weightQ6_K[6144 16384]
-
blk.22.ffn_up.weightQ6_K[6144 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.attn_k.weightQ6_K[6144 1024]
-
blk.22.attn_output.weightQ6_K[6144 6144]
-
blk.22.attn_q.weightQ6_K[6144 6144]
-
blk.22.attn_v.weightQ6_K[6144 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_down.weightQ6_K[16384 6144]
-
blk.23.ffn_gate.weightQ6_K[6144 16384]
-
blk.23.ffn_up.weightQ6_K[6144 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.attn_k.weightQ6_K[6144 1024]
-
blk.23.attn_output.weightQ6_K[6144 6144]
-
blk.23.attn_q.weightQ6_K[6144 6144]
-
blk.23.attn_v.weightQ6_K[6144 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_down.weightQ6_K[16384 6144]
-
blk.24.ffn_gate.weightQ6_K[6144 16384]
-
blk.24.ffn_up.weightQ6_K[6144 16384]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.attn_k.weightQ6_K[6144 1024]
-
blk.24.attn_output.weightQ6_K[6144 6144]
-
blk.24.attn_q.weightQ6_K[6144 6144]
-
blk.24.attn_v.weightQ6_K[6144 1024]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_down.weightQ6_K[16384 6144]
-
blk.25.ffn_gate.weightQ6_K[6144 16384]
-
blk.25.ffn_up.weightQ6_K[6144 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.attn_k.weightQ6_K[6144 1024]
-
blk.25.attn_output.weightQ6_K[6144 6144]
-
blk.25.attn_q.weightQ6_K[6144 6144]
-
blk.25.attn_v.weightQ6_K[6144 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_down.weightQ6_K[16384 6144]
-
blk.26.ffn_gate.weightQ6_K[6144 16384]
-
blk.26.ffn_up.weightQ6_K[6144 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.attn_k.weightQ6_K[6144 1024]
-
blk.26.attn_output.weightQ6_K[6144 6144]
-
blk.26.attn_q.weightQ6_K[6144 6144]
-
blk.26.attn_v.weightQ6_K[6144 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_down.weightQ6_K[16384 6144]
-
blk.27.ffn_gate.weightQ6_K[6144 16384]
-
blk.27.ffn_up.weightQ6_K[6144 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.attn_k.weightQ6_K[6144 1024]
-
blk.27.attn_output.weightQ6_K[6144 6144]
-
blk.27.attn_q.weightQ6_K[6144 6144]
-
blk.27.attn_v.weightQ6_K[6144 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_down.weightQ6_K[16384 6144]
-
blk.28.ffn_gate.weightQ6_K[6144 16384]
-
blk.28.ffn_up.weightQ6_K[6144 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.attn_k.weightQ6_K[6144 1024]
-
blk.28.attn_output.weightQ6_K[6144 6144]
-
blk.28.attn_q.weightQ6_K[6144 6144]
-
blk.28.attn_v.weightQ6_K[6144 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_down.weightQ6_K[16384 6144]
-
blk.29.ffn_gate.weightQ6_K[6144 16384]
-
blk.29.ffn_up.weightQ6_K[6144 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.attn_k.weightQ6_K[6144 1024]
-
blk.29.attn_output.weightQ6_K[6144 6144]
-
blk.29.attn_q.weightQ6_K[6144 6144]
-
blk.29.attn_v.weightQ6_K[6144 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_down.weightQ6_K[16384 6144]
-
blk.30.ffn_gate.weightQ6_K[6144 16384]
-
blk.30.ffn_up.weightQ6_K[6144 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.attn_k.weightQ6_K[6144 1024]
-
blk.30.attn_output.weightQ6_K[6144 6144]
-
blk.30.attn_q.weightQ6_K[6144 6144]
-
blk.30.attn_v.weightQ6_K[6144 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_down.weightQ6_K[16384 6144]
-
blk.31.ffn_gate.weightQ6_K[6144 16384]
-
blk.31.ffn_up.weightQ6_K[6144 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.attn_k.weightQ6_K[6144 1024]
-
blk.31.attn_output.weightQ6_K[6144 6144]
-
blk.31.attn_q.weightQ6_K[6144 6144]
-
blk.31.attn_v.weightQ6_K[6144 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_down.weightQ6_K[16384 6144]
-
blk.32.ffn_gate.weightQ6_K[6144 16384]
-
blk.32.ffn_up.weightQ6_K[6144 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.attn_k.weightQ6_K[6144 1024]
-
blk.32.attn_output.weightQ6_K[6144 6144]
-
blk.32.attn_q.weightQ6_K[6144 6144]
-
blk.32.attn_v.weightQ6_K[6144 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_down.weightQ6_K[16384 6144]
-
blk.33.ffn_gate.weightQ6_K[6144 16384]
-
blk.33.ffn_up.weightQ6_K[6144 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.attn_k.weightQ6_K[6144 1024]
-
blk.33.attn_output.weightQ6_K[6144 6144]
-
blk.33.attn_q.weightQ6_K[6144 6144]
-
blk.33.attn_v.weightQ6_K[6144 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_down.weightQ6_K[16384 6144]
-
blk.34.ffn_gate.weightQ6_K[6144 16384]
-
blk.34.ffn_up.weightQ6_K[6144 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.attn_k.weightQ6_K[6144 1024]
-
blk.34.attn_output.weightQ6_K[6144 6144]
-
blk.34.attn_q.weightQ6_K[6144 6144]
-
blk.34.attn_v.weightQ6_K[6144 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_down.weightQ6_K[16384 6144]
-
blk.35.ffn_gate.weightQ6_K[6144 16384]
-
blk.35.ffn_up.weightQ6_K[6144 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.attn_k.weightQ6_K[6144 1024]
-
blk.35.attn_output.weightQ6_K[6144 6144]
-
blk.35.attn_q.weightQ6_K[6144 6144]
-
blk.35.attn_v.weightQ6_K[6144 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_down.weightQ6_K[16384 6144]
-
blk.36.ffn_gate.weightQ6_K[6144 16384]
-
blk.36.ffn_up.weightQ6_K[6144 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.attn_k.weightQ6_K[6144 1024]
-
blk.36.attn_output.weightQ6_K[6144 6144]
-
blk.36.attn_q.weightQ6_K[6144 6144]
-
blk.36.attn_v.weightQ6_K[6144 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_down.weightQ6_K[16384 6144]
-
blk.37.ffn_gate.weightQ6_K[6144 16384]
-
blk.37.ffn_up.weightQ6_K[6144 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.37.attn_k.weightQ6_K[6144 1024]
-
blk.37.attn_output.weightQ6_K[6144 6144]
-
blk.37.attn_q.weightQ6_K[6144 6144]
-
blk.37.attn_v.weightQ6_K[6144 1024]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_down.weightQ6_K[16384 6144]
-
blk.38.ffn_gate.weightQ6_K[6144 16384]
-
blk.38.ffn_up.weightQ6_K[6144 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.attn_k.weightQ6_K[6144 1024]
-
blk.38.attn_output.weightQ6_K[6144 6144]
-
blk.38.attn_q.weightQ6_K[6144 6144]
-
blk.38.attn_v.weightQ6_K[6144 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_down.weightQ6_K[16384 6144]
-
blk.39.ffn_gate.weightQ6_K[6144 16384]
-
blk.39.ffn_up.weightQ6_K[6144 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.attn_k.weightQ6_K[6144 1024]
-
blk.39.attn_output.weightQ6_K[6144 6144]
-
blk.39.attn_q.weightQ6_K[6144 6144]
-
blk.39.attn_v.weightQ6_K[6144 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_down.weightQ6_K[16384 6144]
-
blk.40.ffn_gate.weightQ6_K[6144 16384]
-
blk.40.ffn_up.weightQ6_K[6144 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.attn_k.weightQ6_K[6144 1024]
-
blk.40.attn_output.weightQ6_K[6144 6144]
-
blk.40.attn_q.weightQ6_K[6144 6144]
-
blk.40.attn_v.weightQ6_K[6144 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_down.weightQ6_K[16384 6144]
-
blk.41.ffn_gate.weightQ6_K[6144 16384]
-
blk.41.ffn_up.weightQ6_K[6144 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.attn_k.weightQ6_K[6144 1024]
-
blk.41.attn_output.weightQ6_K[6144 6144]
-
blk.41.attn_q.weightQ6_K[6144 6144]
-
blk.41.attn_v.weightQ6_K[6144 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_down.weightQ6_K[16384 6144]
-
blk.42.ffn_gate.weightQ6_K[6144 16384]
-
blk.42.ffn_up.weightQ6_K[6144 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.attn_k.weightQ6_K[6144 1024]
-
blk.42.attn_output.weightQ6_K[6144 6144]
-
blk.42.attn_q.weightQ6_K[6144 6144]
-
blk.42.attn_v.weightQ6_K[6144 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_down.weightQ6_K[16384 6144]
-
blk.43.ffn_gate.weightQ6_K[6144 16384]
-
blk.43.ffn_up.weightQ6_K[6144 16384]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.43.attn_k.weightQ6_K[6144 1024]
-
blk.43.attn_output.weightQ6_K[6144 6144]
-
blk.43.attn_q.weightQ6_K[6144 6144]
-
blk.43.attn_v.weightQ6_K[6144 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_down.weightQ6_K[16384 6144]
-
blk.44.ffn_gate.weightQ6_K[6144 16384]
-
blk.44.ffn_up.weightQ6_K[6144 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.attn_k.weightQ6_K[6144 1024]
-
blk.44.attn_output.weightQ6_K[6144 6144]
-
blk.44.attn_q.weightQ6_K[6144 6144]
-
blk.44.attn_v.weightQ6_K[6144 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_down.weightQ6_K[16384 6144]
-
blk.45.ffn_gate.weightQ6_K[6144 16384]
-
blk.45.ffn_up.weightQ6_K[6144 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.attn_k.weightQ6_K[6144 1024]
-
blk.45.attn_output.weightQ6_K[6144 6144]
-
blk.45.attn_q.weightQ6_K[6144 6144]
-
blk.45.attn_v.weightQ6_K[6144 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_down.weightQ6_K[16384 6144]
-
blk.46.ffn_gate.weightQ6_K[6144 16384]
-
blk.46.ffn_up.weightQ6_K[6144 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.attn_k.weightQ6_K[6144 1024]
-
blk.46.attn_output.weightQ6_K[6144 6144]
-
blk.46.attn_q.weightQ6_K[6144 6144]
-
blk.46.attn_v.weightQ6_K[6144 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_down.weightQ6_K[16384 6144]
-
blk.47.ffn_gate.weightQ6_K[6144 16384]
-
blk.47.ffn_up.weightQ6_K[6144 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.attn_k.weightQ6_K[6144 1024]
-
blk.47.attn_output.weightQ6_K[6144 6144]
-
blk.47.attn_q.weightQ6_K[6144 6144]
-
blk.47.attn_v.weightQ6_K[6144 1024]
-
blk.48.attn_norm.weightF32[6144]
-
blk.48.ffn_down.weightQ6_K[16384 6144]
-
blk.48.ffn_gate.weightQ6_K[6144 16384]
-
blk.48.ffn_up.weightQ6_K[6144 16384]
-
blk.48.ffn_norm.weightF32[6144]
-
blk.48.attn_k.weightQ6_K[6144 1024]
-
blk.48.attn_output.weightQ6_K[6144 6144]
-
blk.48.attn_q.weightQ6_K[6144 6144]
-
blk.48.attn_v.weightQ6_K[6144 1024]
-
blk.49.attn_norm.weightF32[6144]
-
blk.49.ffn_down.weightQ6_K[16384 6144]
-
blk.49.ffn_gate.weightQ6_K[6144 16384]
-
blk.49.ffn_up.weightQ6_K[6144 16384]
-
blk.49.ffn_norm.weightF32[6144]
-
blk.49.attn_k.weightQ6_K[6144 1024]
-
blk.49.attn_output.weightQ6_K[6144 6144]
-
blk.49.attn_q.weightQ6_K[6144 6144]
-
blk.49.attn_v.weightQ6_K[6144 1024]
-
blk.50.attn_norm.weightF32[6144]
-
blk.50.ffn_down.weightQ6_K[16384 6144]
-
blk.50.ffn_gate.weightQ6_K[6144 16384]
-
blk.50.ffn_up.weightQ6_K[6144 16384]
-
blk.50.ffn_norm.weightF32[6144]
-
blk.50.attn_k.weightQ6_K[6144 1024]
-
blk.50.attn_output.weightQ6_K[6144 6144]
-
blk.50.attn_q.weightQ6_K[6144 6144]
-
blk.50.attn_v.weightQ6_K[6144 1024]
-
blk.51.attn_norm.weightF32[6144]
-
blk.51.ffn_down.weightQ6_K[16384 6144]
-
blk.51.ffn_gate.weightQ6_K[6144 16384]
-
blk.51.ffn_up.weightQ6_K[6144 16384]
-
blk.51.ffn_norm.weightF32[6144]
-
blk.51.attn_k.weightQ6_K[6144 1024]
-
blk.51.attn_output.weightQ6_K[6144 6144]
-
blk.51.attn_q.weightQ6_K[6144 6144]
-
blk.51.attn_v.weightQ6_K[6144 1024]
-
blk.52.attn_norm.weightF32[6144]
-
blk.52.ffn_down.weightQ6_K[16384 6144]
-
blk.52.ffn_gate.weightQ6_K[6144 16384]
-
blk.52.ffn_up.weightQ6_K[6144 16384]
-
blk.52.ffn_norm.weightF32[6144]
-
blk.52.attn_k.weightQ6_K[6144 1024]
-
blk.52.attn_output.weightQ6_K[6144 6144]
-
blk.52.attn_q.weightQ6_K[6144 6144]
-
blk.52.attn_v.weightQ6_K[6144 1024]
-
blk.53.attn_norm.weightF32[6144]
-
blk.53.ffn_down.weightQ6_K[16384 6144]
-
blk.53.ffn_gate.weightQ6_K[6144 16384]
-
blk.53.ffn_up.weightQ6_K[6144 16384]
-
blk.53.ffn_norm.weightF32[6144]
-
blk.53.attn_k.weightQ6_K[6144 1024]
-
blk.53.attn_output.weightQ6_K[6144 6144]
-
blk.53.attn_q.weightQ6_K[6144 6144]
-
blk.53.attn_v.weightQ6_K[6144 1024]
-
blk.54.attn_norm.weightF32[6144]
-
blk.54.ffn_down.weightQ6_K[16384 6144]
-
blk.54.ffn_gate.weightQ6_K[6144 16384]
-
blk.54.ffn_up.weightQ6_K[6144 16384]
-
blk.54.ffn_norm.weightF32[6144]
-
blk.54.attn_k.weightQ6_K[6144 1024]
-
blk.54.attn_output.weightQ6_K[6144 6144]
-
blk.54.attn_q.weightQ6_K[6144 6144]
-
blk.54.attn_v.weightQ6_K[6144 1024]
-
blk.55.attn_norm.weightF32[6144]
-
blk.55.ffn_down.weightQ6_K[16384 6144]
-
blk.55.ffn_gate.weightQ6_K[6144 16384]
-
blk.55.ffn_up.weightQ6_K[6144 16384]
-
blk.55.ffn_norm.weightF32[6144]
-
blk.55.attn_k.weightQ6_K[6144 1024]
-
blk.55.attn_output.weightQ6_K[6144 6144]
-
blk.55.attn_q.weightQ6_K[6144 6144]
-
blk.55.attn_v.weightQ6_K[6144 1024]
-
output.weightQ6_K[6144 32768]
-
output_norm.weightF32[6144]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55