I-quants for mistral-large-instruct-2407
Tools
123B
18 Pulls Updated 2 weeks ago
2d405649893a · 28GB
-
quantize.imatrix.chunks_count148
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count616
-
quantize.imatrix.file/models_out/Mistral-Large-Instruct-2407-GGUF/Mistral-Large-Instruct-2407.imatrix
-
general.architecturellama
-
general.file_typeBF16
-
llama.attention.head_count96
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count88
-
llama.context_length131072
-
llama.embedding_length12288
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32768
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 4 4 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ2_K[12288 32768]
-
blk.0.attn_norm.weightF32[12288]
-
blk.0.ffn_down.weightQ2_K[28672 12288]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.0.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.0.ffn_norm.weightF32[12288]
-
blk.0.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.0.attn_output.weightI8[12288 12288]
-
blk.0.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.0.attn_v.weightQ4_K[12288 1024]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.1.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.1.attn_output.weightI8[12288 12288]
-
blk.1.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.1.attn_v.weightQ4_K[12288 1024]
-
blk.1.attn_norm.weightF32[12288]
-
blk.1.ffn_down.weightQ2_K[28672 12288]
-
blk.1.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.1.ffn_norm.weightF32[12288]
-
blk.2.attn_norm.weightF32[12288]
-
blk.2.ffn_down.weightQ2_K[28672 12288]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.2.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.2.ffn_norm.weightF32[12288]
-
blk.2.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.2.attn_output.weightI8[12288 12288]
-
blk.2.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.2.attn_v.weightQ4_K[12288 1024]
-
blk.3.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.3.attn_output.weightI8[12288 12288]
-
blk.3.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.3.attn_v.weightQ4_K[12288 1024]
-
blk.3.attn_norm.weightF32[12288]
-
blk.3.ffn_down.weightQ2_K[28672 12288]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.3.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.3.ffn_norm.weightF32[12288]
-
blk.4.attn_norm.weightF32[12288]
-
blk.4.ffn_down.weightQ2_K[28672 12288]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.4.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.4.ffn_norm.weightF32[12288]
-
blk.4.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.4.attn_output.weightI8[12288 12288]
-
blk.4.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.4.attn_v.weightQ4_K[12288 1024]
-
blk.5.attn_norm.weightF32[12288]
-
blk.5.ffn_down.weightQ2_K[28672 12288]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.5.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.5.ffn_norm.weightF32[12288]
-
blk.5.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.5.attn_output.weightI8[12288 12288]
-
blk.5.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.5.attn_v.weightQ4_K[12288 1024]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.6.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.6.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.6.attn_output.weightI8[12288 12288]
-
blk.6.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.6.attn_v.weightQ4_K[12288 1024]
-
blk.6.attn_norm.weightF32[12288]
-
blk.6.ffn_down.weightQ2_K[28672 12288]
-
blk.6.ffn_norm.weightF32[12288]
-
blk.7.attn_norm.weightF32[12288]
-
blk.7.ffn_down.weightQ2_K[28672 12288]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.7.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.7.ffn_norm.weightF32[12288]
-
blk.7.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.7.attn_output.weightI8[12288 12288]
-
blk.7.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.7.attn_v.weightQ4_K[12288 1024]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.8.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.8.attn_output.weightI8[12288 12288]
-
blk.8.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.8.attn_v.weightQ4_K[12288 1024]
-
blk.8.attn_norm.weightF32[12288]
-
blk.8.ffn_down.weightQ2_K[28672 12288]
-
blk.8.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.8.ffn_norm.weightF32[12288]
-
blk.9.attn_norm.weightF32[12288]
-
blk.9.ffn_down.weightQ2_K[28672 12288]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.9.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.9.ffn_norm.weightF32[12288]
-
blk.9.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.9.attn_output.weightI8[12288 12288]
-
blk.9.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.9.attn_v.weightQ4_K[12288 1024]
-
blk.10.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.10.attn_output.weightI8[12288 12288]
-
blk.10.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.10.attn_v.weightQ4_K[12288 1024]
-
blk.10.attn_norm.weightF32[12288]
-
blk.10.ffn_down.weightQ2_K[28672 12288]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.10.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.10.ffn_norm.weightF32[12288]
-
blk.11.attn_norm.weightF32[12288]
-
blk.11.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.11.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.11.ffn_norm.weightF32[12288]
-
blk.11.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.11.attn_output.weightI8[12288 12288]
-
blk.11.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.11.attn_v.weightQ4_K[12288 1024]
-
blk.12.attn_norm.weightF32[12288]
-
blk.12.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.12.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.12.ffn_norm.weightF32[12288]
-
blk.12.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.12.attn_output.weightI8[12288 12288]
-
blk.12.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.12.attn_v.weightQ4_K[12288 1024]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.13.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.13.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.13.attn_output.weightI8[12288 12288]
-
blk.13.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.13.attn_v.weightQ4_K[12288 1024]
-
blk.13.attn_norm.weightF32[12288]
-
blk.13.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.13.ffn_norm.weightF32[12288]
-
blk.14.attn_norm.weightF32[12288]
-
blk.14.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.14.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.14.ffn_norm.weightF32[12288]
-
blk.14.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.14.attn_output.weightI8[12288 12288]
-
blk.14.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.14.attn_v.weightQ4_K[12288 1024]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.15.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.15.attn_output.weightI8[12288 12288]
-
blk.15.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.15.attn_v.weightQ4_K[12288 1024]
-
blk.15.attn_norm.weightF32[12288]
-
blk.15.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.15.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.15.ffn_norm.weightF32[12288]
-
blk.16.attn_norm.weightF32[12288]
-
blk.16.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.16.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.16.ffn_norm.weightF32[12288]
-
blk.16.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.16.attn_output.weightI8[12288 12288]
-
blk.16.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.16.attn_v.weightQ4_K[12288 1024]
-
blk.17.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.17.attn_output.weightI8[12288 12288]
-
blk.17.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.17.attn_v.weightQ4_K[12288 1024]
-
blk.17.attn_norm.weightF32[12288]
-
blk.17.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.17.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.17.ffn_norm.weightF32[12288]
-
blk.18.attn_norm.weightF32[12288]
-
blk.18.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.18.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.18.ffn_norm.weightF32[12288]
-
blk.18.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.18.attn_output.weightI8[12288 12288]
-
blk.18.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.18.attn_v.weightQ4_K[12288 1024]
-
blk.19.attn_norm.weightF32[12288]
-
blk.19.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.19.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.19.ffn_norm.weightF32[12288]
-
blk.19.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.19.attn_output.weightI8[12288 12288]
-
blk.19.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.19.attn_v.weightQ4_K[12288 1024]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.20.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.20.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.20.attn_output.weightI8[12288 12288]
-
blk.20.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.20.attn_v.weightQ4_K[12288 1024]
-
blk.20.attn_norm.weightF32[12288]
-
blk.20.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.20.ffn_norm.weightF32[12288]
-
blk.21.attn_norm.weightF32[12288]
-
blk.21.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.21.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.21.ffn_norm.weightF32[12288]
-
blk.21.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.21.attn_output.weightI8[12288 12288]
-
blk.21.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.21.attn_v.weightQ4_K[12288 1024]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.22.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.22.attn_output.weightI8[12288 12288]
-
blk.22.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.22.attn_v.weightQ4_K[12288 1024]
-
blk.22.attn_norm.weightF32[12288]
-
blk.22.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.22.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.22.ffn_norm.weightF32[12288]
-
blk.23.attn_norm.weightF32[12288]
-
blk.23.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.23.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.23.ffn_norm.weightF32[12288]
-
blk.23.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.23.attn_output.weightI8[12288 12288]
-
blk.23.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.23.attn_v.weightQ4_K[12288 1024]
-
blk.24.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.24.attn_output.weightI8[12288 12288]
-
blk.24.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.24.attn_v.weightQ4_K[12288 1024]
-
blk.24.attn_norm.weightF32[12288]
-
blk.24.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.24.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.24.ffn_norm.weightF32[12288]
-
blk.25.attn_norm.weightF32[12288]
-
blk.25.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.25.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.25.ffn_norm.weightF32[12288]
-
blk.25.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.25.attn_output.weightI8[12288 12288]
-
blk.25.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.25.attn_v.weightQ4_K[12288 1024]
-
blk.26.attn_norm.weightF32[12288]
-
blk.26.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.26.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.26.ffn_norm.weightF32[12288]
-
blk.26.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.26.attn_output.weightI8[12288 12288]
-
blk.26.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.26.attn_v.weightQ4_K[12288 1024]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.27.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.27.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.27.attn_output.weightI8[12288 12288]
-
blk.27.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.27.attn_v.weightQ4_K[12288 1024]
-
blk.27.attn_norm.weightF32[12288]
-
blk.27.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.27.ffn_norm.weightF32[12288]
-
blk.28.attn_norm.weightF32[12288]
-
blk.28.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.28.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.28.ffn_norm.weightF32[12288]
-
blk.28.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.28.attn_output.weightI8[12288 12288]
-
blk.28.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.28.attn_v.weightQ4_K[12288 1024]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.29.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.29.attn_output.weightI8[12288 12288]
-
blk.29.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.29.attn_v.weightQ4_K[12288 1024]
-
blk.29.attn_norm.weightF32[12288]
-
blk.29.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.29.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.29.ffn_norm.weightF32[12288]
-
blk.30.attn_norm.weightF32[12288]
-
blk.30.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.30.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.30.ffn_norm.weightF32[12288]
-
blk.30.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.30.attn_output.weightI8[12288 12288]
-
blk.30.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.30.attn_v.weightQ4_K[12288 1024]
-
blk.31.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.31.attn_output.weightI8[12288 12288]
-
blk.31.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.31.attn_v.weightQ4_K[12288 1024]
-
blk.31.attn_norm.weightF32[12288]
-
blk.31.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.31.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.31.ffn_norm.weightF32[12288]
-
blk.32.attn_norm.weightF32[12288]
-
blk.32.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.32.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.32.ffn_norm.weightF32[12288]
-
blk.32.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.32.attn_output.weightI8[12288 12288]
-
blk.32.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.32.attn_v.weightQ4_K[12288 1024]
-
blk.33.attn_norm.weightF32[12288]
-
blk.33.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.33.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.33.ffn_norm.weightF32[12288]
-
blk.33.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.33.attn_output.weightI8[12288 12288]
-
blk.33.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.33.attn_v.weightQ4_K[12288 1024]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.34.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.34.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.34.attn_output.weightI8[12288 12288]
-
blk.34.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.34.attn_v.weightQ4_K[12288 1024]
-
blk.34.attn_norm.weightF32[12288]
-
blk.34.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.34.ffn_norm.weightF32[12288]
-
blk.35.attn_norm.weightF32[12288]
-
blk.35.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.35.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.35.ffn_norm.weightF32[12288]
-
blk.35.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.35.attn_output.weightI8[12288 12288]
-
blk.35.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.35.attn_v.weightQ4_K[12288 1024]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.36.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.36.attn_output.weightI8[12288 12288]
-
blk.36.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.36.attn_v.weightQ4_K[12288 1024]
-
blk.36.attn_norm.weightF32[12288]
-
blk.36.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.36.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.36.ffn_norm.weightF32[12288]
-
blk.37.attn_norm.weightF32[12288]
-
blk.37.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.37.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.37.ffn_norm.weightF32[12288]
-
blk.37.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.37.attn_output.weightI8[12288 12288]
-
blk.37.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.37.attn_v.weightQ4_K[12288 1024]
-
blk.38.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.38.attn_output.weightI8[12288 12288]
-
blk.38.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.38.attn_v.weightQ4_K[12288 1024]
-
blk.38.attn_norm.weightF32[12288]
-
blk.38.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.38.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.38.ffn_norm.weightF32[12288]
-
blk.39.attn_norm.weightF32[12288]
-
blk.39.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.39.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.39.ffn_norm.weightF32[12288]
-
blk.39.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.39.attn_output.weightI8[12288 12288]
-
blk.39.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.39.attn_v.weightQ4_K[12288 1024]
-
blk.40.attn_norm.weightF32[12288]
-
blk.40.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.40.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.40.ffn_norm.weightF32[12288]
-
blk.40.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.40.attn_output.weightI8[12288 12288]
-
blk.40.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.40.attn_v.weightQ4_K[12288 1024]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.41.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.41.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.41.attn_output.weightI8[12288 12288]
-
blk.41.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.41.attn_v.weightQ4_K[12288 1024]
-
blk.41.attn_norm.weightF32[12288]
-
blk.41.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.41.ffn_norm.weightF32[12288]
-
blk.42.attn_norm.weightF32[12288]
-
blk.42.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.42.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.42.ffn_norm.weightF32[12288]
-
blk.42.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.42.attn_output.weightI8[12288 12288]
-
blk.42.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.42.attn_v.weightQ4_K[12288 1024]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.43.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.43.attn_output.weightI8[12288 12288]
-
blk.43.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.43.attn_v.weightQ4_K[12288 1024]
-
blk.43.attn_norm.weightF32[12288]
-
blk.43.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.43.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.43.ffn_norm.weightF32[12288]
-
blk.44.attn_norm.weightF32[12288]
-
blk.44.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.44.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.44.ffn_norm.weightF32[12288]
-
blk.44.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.44.attn_output.weightI8[12288 12288]
-
blk.44.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.44.attn_v.weightQ4_K[12288 1024]
-
blk.45.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.45.attn_output.weightI8[12288 12288]
-
blk.45.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.45.attn_v.weightQ4_K[12288 1024]
-
blk.45.attn_norm.weightF32[12288]
-
blk.45.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.45.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.45.ffn_norm.weightF32[12288]
-
blk.46.attn_norm.weightF32[12288]
-
blk.46.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.46.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.46.ffn_norm.weightF32[12288]
-
blk.46.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.46.attn_output.weightI8[12288 12288]
-
blk.46.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.46.attn_v.weightQ4_K[12288 1024]
-
blk.47.attn_norm.weightF32[12288]
-
blk.47.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.47.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.47.ffn_norm.weightF32[12288]
-
blk.47.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.47.attn_output.weightI8[12288 12288]
-
blk.47.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.47.attn_v.weightQ4_K[12288 1024]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.48.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.48.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.48.attn_output.weightI8[12288 12288]
-
blk.48.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.48.attn_v.weightQ4_K[12288 1024]
-
blk.48.attn_norm.weightF32[12288]
-
blk.48.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.48.ffn_norm.weightF32[12288]
-
blk.49.attn_norm.weightF32[12288]
-
blk.49.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.49.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.49.ffn_norm.weightF32[12288]
-
blk.49.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.49.attn_output.weightI8[12288 12288]
-
blk.49.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.49.attn_v.weightQ4_K[12288 1024]
-
blk.50.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.50.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.50.attn_output.weightI8[12288 12288]
-
blk.50.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.50.attn_v.weightQ4_K[12288 1024]
-
blk.50.attn_norm.weightF32[12288]
-
blk.50.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.50.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.50.ffn_norm.weightF32[12288]
-
blk.51.attn_norm.weightF32[12288]
-
blk.51.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.51.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.51.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.51.ffn_norm.weightF32[12288]
-
blk.51.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.51.attn_output.weightI8[12288 12288]
-
blk.51.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.51.attn_v.weightQ4_K[12288 1024]
-
blk.52.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.52.attn_output.weightI8[12288 12288]
-
blk.52.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.52.attn_v.weightQ4_K[12288 1024]
-
blk.52.attn_norm.weightF32[12288]
-
blk.52.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.52.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.52.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.52.ffn_norm.weightF32[12288]
-
blk.53.attn_norm.weightF32[12288]
-
blk.53.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.53.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.53.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.53.ffn_norm.weightF32[12288]
-
blk.53.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.53.attn_output.weightI8[12288 12288]
-
blk.53.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.53.attn_v.weightQ4_K[12288 1024]
-
blk.54.attn_norm.weightF32[12288]
-
blk.54.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.54.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.54.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.54.ffn_norm.weightF32[12288]
-
blk.54.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.54.attn_output.weightI8[12288 12288]
-
blk.54.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.54.attn_v.weightQ4_K[12288 1024]
-
blk.55.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.55.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.55.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.55.attn_output.weightI8[12288 12288]
-
blk.55.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.55.attn_v.weightQ4_K[12288 1024]
-
blk.55.attn_norm.weightF32[12288]
-
blk.55.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.55.ffn_norm.weightF32[12288]
-
blk.56.attn_norm.weightF32[12288]
-
blk.56.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.56.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.56.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.56.ffn_norm.weightF32[12288]
-
blk.56.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.56.attn_output.weightI8[12288 12288]
-
blk.56.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.56.attn_v.weightQ4_K[12288 1024]
-
blk.57.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.57.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.57.attn_output.weightI8[12288 12288]
-
blk.57.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.57.attn_v.weightQ4_K[12288 1024]
-
blk.57.attn_norm.weightF32[12288]
-
blk.57.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.57.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.57.ffn_norm.weightF32[12288]
-
blk.58.attn_norm.weightF32[12288]
-
blk.58.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.58.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.58.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.58.ffn_norm.weightF32[12288]
-
blk.58.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.58.attn_output.weightI8[12288 12288]
-
blk.58.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.58.attn_v.weightQ4_K[12288 1024]
-
blk.59.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.59.attn_output.weightI8[12288 12288]
-
blk.59.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.59.attn_v.weightQ4_K[12288 1024]
-
blk.59.attn_norm.weightF32[12288]
-
blk.59.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.59.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.59.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.59.ffn_norm.weightF32[12288]
-
blk.60.attn_norm.weightF32[12288]
-
blk.60.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.60.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.60.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.60.ffn_norm.weightF32[12288]
-
blk.60.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.60.attn_output.weightI8[12288 12288]
-
blk.60.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.60.attn_v.weightQ4_K[12288 1024]
-
blk.61.attn_norm.weightF32[12288]
-
blk.61.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.61.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.61.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.61.ffn_norm.weightF32[12288]
-
blk.61.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.61.attn_output.weightI8[12288 12288]
-
blk.61.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.61.attn_v.weightQ4_K[12288 1024]
-
blk.62.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.62.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.62.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.62.attn_output.weightI8[12288 12288]
-
blk.62.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.62.attn_v.weightQ4_K[12288 1024]
-
blk.62.attn_norm.weightF32[12288]
-
blk.62.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.62.ffn_norm.weightF32[12288]
-
blk.63.attn_norm.weightF32[12288]
-
blk.63.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.63.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.63.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.63.ffn_norm.weightF32[12288]
-
blk.63.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.63.attn_output.weightI8[12288 12288]
-
blk.63.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.63.attn_v.weightQ4_K[12288 1024]
-
blk.64.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.64.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.64.attn_output.weightI8[12288 12288]
-
blk.64.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.64.attn_v.weightQ4_K[12288 1024]
-
blk.64.attn_norm.weightF32[12288]
-
blk.64.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.64.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.64.ffn_norm.weightF32[12288]
-
blk.65.attn_norm.weightF32[12288]
-
blk.65.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.65.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.65.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.65.ffn_norm.weightF32[12288]
-
blk.65.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.65.attn_output.weightI8[12288 12288]
-
blk.65.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.65.attn_v.weightQ4_K[12288 1024]
-
blk.66.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.66.attn_output.weightI8[12288 12288]
-
blk.66.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.66.attn_v.weightQ4_K[12288 1024]
-
blk.66.attn_norm.weightF32[12288]
-
blk.66.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.66.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.66.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.66.ffn_norm.weightF32[12288]
-
blk.67.attn_norm.weightF32[12288]
-
blk.67.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.67.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.67.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.67.ffn_norm.weightF32[12288]
-
blk.67.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.67.attn_output.weightI8[12288 12288]
-
blk.67.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.67.attn_v.weightQ4_K[12288 1024]
-
blk.68.attn_norm.weightF32[12288]
-
blk.68.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.68.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.68.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.68.ffn_norm.weightF32[12288]
-
blk.68.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.68.attn_output.weightI8[12288 12288]
-
blk.68.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.68.attn_v.weightQ4_K[12288 1024]
-
blk.69.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.69.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.69.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.69.attn_output.weightI8[12288 12288]
-
blk.69.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.69.attn_v.weightQ4_K[12288 1024]
-
blk.69.attn_norm.weightF32[12288]
-
blk.69.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.69.ffn_norm.weightF32[12288]
-
blk.70.attn_norm.weightF32[12288]
-
blk.70.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.70.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.70.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.70.ffn_norm.weightF32[12288]
-
blk.70.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.70.attn_output.weightI8[12288 12288]
-
blk.70.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.70.attn_v.weightQ4_K[12288 1024]
-
blk.71.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.71.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.71.attn_output.weightI8[12288 12288]
-
blk.71.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.71.attn_v.weightQ4_K[12288 1024]
-
blk.71.attn_norm.weightF32[12288]
-
blk.71.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.71.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.71.ffn_norm.weightF32[12288]
-
blk.72.attn_norm.weightF32[12288]
-
blk.72.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.72.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.72.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.72.ffn_norm.weightF32[12288]
-
blk.72.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.72.attn_output.weightI8[12288 12288]
-
blk.72.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.72.attn_v.weightQ4_K[12288 1024]
-
blk.73.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.73.attn_output.weightI8[12288 12288]
-
blk.73.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.73.attn_v.weightQ4_K[12288 1024]
-
blk.73.attn_norm.weightF32[12288]
-
blk.73.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.73.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.73.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.73.ffn_norm.weightF32[12288]
-
blk.74.attn_norm.weightF32[12288]
-
blk.74.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.74.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.74.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.74.ffn_norm.weightF32[12288]
-
blk.74.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.74.attn_output.weightI8[12288 12288]
-
blk.74.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.74.attn_v.weightQ4_K[12288 1024]
-
blk.75.attn_norm.weightF32[12288]
-
blk.75.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.75.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.75.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.75.ffn_norm.weightF32[12288]
-
blk.75.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.75.attn_output.weightI8[12288 12288]
-
blk.75.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.75.attn_v.weightQ4_K[12288 1024]
-
blk.76.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.76.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.76.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.76.attn_output.weightI8[12288 12288]
-
blk.76.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.76.attn_v.weightQ4_K[12288 1024]
-
blk.76.attn_norm.weightF32[12288]
-
blk.76.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.76.ffn_norm.weightF32[12288]
-
blk.77.attn_norm.weightF32[12288]
-
blk.77.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.77.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.77.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.77.ffn_norm.weightF32[12288]
-
blk.77.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.77.attn_output.weightI8[12288 12288]
-
blk.77.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.77.attn_v.weightQ4_K[12288 1024]
-
blk.78.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.78.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.78.attn_output.weightI8[12288 12288]
-
blk.78.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.78.attn_v.weightQ4_K[12288 1024]
-
blk.78.attn_norm.weightF32[12288]
-
blk.78.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.78.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.78.ffn_norm.weightF32[12288]
-
blk.79.attn_norm.weightF32[12288]
-
blk.79.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.79.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.79.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.79.ffn_norm.weightF32[12288]
-
blk.79.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.79.attn_output.weightI8[12288 12288]
-
blk.79.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.79.attn_v.weightQ4_K[12288 1024]
-
blk.80.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.80.attn_output.weightI8[12288 12288]
-
blk.80.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.80.attn_v.weightQ4_K[12288 1024]
-
blk.80.attn_norm.weightF32[12288]
-
blk.80.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.80.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.80.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.80.ffn_norm.weightF32[12288]
-
blk.81.attn_norm.weightF32[12288]
-
blk.81.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.81.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.81.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.81.ffn_norm.weightF32[12288]
-
blk.81.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.81.attn_output.weightI8[12288 12288]
-
blk.81.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.81.attn_v.weightQ4_K[12288 1024]
-
blk.82.attn_norm.weightF32[12288]
-
blk.82.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.82.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.82.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.82.ffn_norm.weightF32[12288]
-
blk.82.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.82.attn_output.weightI8[12288 12288]
-
blk.82.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.82.attn_v.weightQ4_K[12288 1024]
-
blk.83.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.83.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.83.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.83.attn_output.weightI8[12288 12288]
-
blk.83.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.83.attn_v.weightQ4_K[12288 1024]
-
blk.83.attn_norm.weightF32[12288]
-
blk.83.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.83.ffn_norm.weightF32[12288]
-
blk.84.attn_norm.weightF32[12288]
-
blk.84.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.84.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.84.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.84.ffn_norm.weightF32[12288]
-
blk.84.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.84.attn_output.weightI8[12288 12288]
-
blk.84.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.84.attn_v.weightQ4_K[12288 1024]
-
blk.85.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.85.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.85.attn_output.weightI8[12288 12288]
-
blk.85.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.85.attn_v.weightQ4_K[12288 1024]
-
blk.85.attn_norm.weightF32[12288]
-
blk.85.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.85.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.85.ffn_norm.weightF32[12288]
-
blk.86.attn_norm.weightF32[12288]
-
blk.86.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.86.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.86.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.86.ffn_norm.weightF32[12288]
-
blk.86.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.86.attn_output.weightI8[12288 12288]
-
blk.86.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.86.attn_v.weightQ4_K[12288 1024]
-
blk.87.attn_k.weight(!unknown_type 29!)[12288 1024]
-
blk.87.attn_output.weightI8[12288 12288]
-
blk.87.attn_q.weight(!unknown_type 29!)[12288 12288]
-
blk.87.attn_v.weightQ4_K[12288 1024]
-
blk.87.attn_norm.weightF32[12288]
-
blk.87.ffn_down.weight(!unknown_type 29!)[28672 12288]
-
blk.87.ffn_gate.weight(!unknown_type 29!)[12288 28672]
-
blk.87.ffn_up.weight(!unknown_type 29!)[12288 28672]
-
blk.87.ffn_norm.weightF32[12288]
-
output.weightQ5_K[12288 32768]
-
output_norm.weightF32[12288]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79
blk.80
blk.81
blk.82
blk.83
blk.84
blk.85
blk.86
blk.87