I-quants for mistral-large-instruct-2407
Tools
123B
18 Pulls Updated 2 weeks ago
992bf07a14a6 · 47GB
-
quantize.imatrix.chunks_count148
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count616
-
quantize.imatrix.file/models_out/Mistral-Large-Instruct-2407-GGUF/Mistral-Large-Instruct-2407.imatrix
-
general.architecturellama
-
general.file_typeIQ3_XXS
-
llama.attention.head_count96
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count88
-
llama.context_length131072
-
llama.embedding_length12288
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32768
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 4 4 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[12288 32768]
-
blk.0.attn_norm.weightF32[12288]
-
blk.0.ffn_down.weightI32[28672 12288]
-
blk.0.ffn_gate.weightI32[12288 28672]
-
blk.0.ffn_up.weightI32[12288 28672]
-
blk.0.ffn_norm.weightF32[12288]
-
blk.0.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.0.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.0.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.0.attn_v.weightQ4_K[12288 1024]
-
blk.1.ffn_gate.weightI32[12288 28672]
-
blk.1.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.1.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.1.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.1.attn_v.weightQ4_K[12288 1024]
-
blk.1.attn_norm.weightF32[12288]
-
blk.1.ffn_down.weightI32[28672 12288]
-
blk.1.ffn_up.weightI32[12288 28672]
-
blk.1.ffn_norm.weightF32[12288]
-
blk.2.attn_norm.weightF32[12288]
-
blk.2.ffn_down.weightI32[28672 12288]
-
blk.2.ffn_gate.weightI32[12288 28672]
-
blk.2.ffn_up.weightI32[12288 28672]
-
blk.2.ffn_norm.weightF32[12288]
-
blk.2.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.2.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.2.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.2.attn_v.weightQ4_K[12288 1024]
-
blk.3.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.3.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.3.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.3.attn_v.weightQ4_K[12288 1024]
-
blk.3.attn_norm.weightF32[12288]
-
blk.3.ffn_down.weightI32[28672 12288]
-
blk.3.ffn_gate.weightI32[12288 28672]
-
blk.3.ffn_up.weightI32[12288 28672]
-
blk.3.ffn_norm.weightF32[12288]
-
blk.4.attn_norm.weightF32[12288]
-
blk.4.ffn_down.weightI32[28672 12288]
-
blk.4.ffn_gate.weightI32[12288 28672]
-
blk.4.ffn_up.weightI32[12288 28672]
-
blk.4.ffn_norm.weightF32[12288]
-
blk.4.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.4.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.4.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.4.attn_v.weightQ4_K[12288 1024]
-
blk.5.attn_norm.weightF32[12288]
-
blk.5.ffn_down.weightI32[28672 12288]
-
blk.5.ffn_gate.weightI32[12288 28672]
-
blk.5.ffn_up.weightI32[12288 28672]
-
blk.5.ffn_norm.weightF32[12288]
-
blk.5.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.5.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.5.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.5.attn_v.weightQ4_K[12288 1024]
-
blk.6.ffn_gate.weightI32[12288 28672]
-
blk.6.ffn_up.weightI32[12288 28672]
-
blk.6.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.6.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.6.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.6.attn_v.weightQ4_K[12288 1024]
-
blk.6.attn_norm.weightF32[12288]
-
blk.6.ffn_down.weightI32[28672 12288]
-
blk.6.ffn_norm.weightF32[12288]
-
blk.7.attn_norm.weightF32[12288]
-
blk.7.ffn_down.weightI32[28672 12288]
-
blk.7.ffn_gate.weightI32[12288 28672]
-
blk.7.ffn_up.weightI32[12288 28672]
-
blk.7.ffn_norm.weightF32[12288]
-
blk.7.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.7.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.7.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.7.attn_v.weightQ4_K[12288 1024]
-
blk.8.ffn_gate.weightI32[12288 28672]
-
blk.8.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.8.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.8.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.8.attn_v.weightQ4_K[12288 1024]
-
blk.8.attn_norm.weightF32[12288]
-
blk.8.ffn_down.weightI32[28672 12288]
-
blk.8.ffn_up.weightI32[12288 28672]
-
blk.8.ffn_norm.weightF32[12288]
-
blk.9.attn_norm.weightF32[12288]
-
blk.9.ffn_down.weightI32[28672 12288]
-
blk.9.ffn_gate.weightI32[12288 28672]
-
blk.9.ffn_up.weightI32[12288 28672]
-
blk.9.ffn_norm.weightF32[12288]
-
blk.9.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.9.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.9.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.9.attn_v.weightQ4_K[12288 1024]
-
blk.10.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.10.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.10.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.10.attn_v.weightQ4_K[12288 1024]
-
blk.10.attn_norm.weightF32[12288]
-
blk.10.ffn_down.weightI32[28672 12288]
-
blk.10.ffn_gate.weightI32[12288 28672]
-
blk.10.ffn_up.weightI32[12288 28672]
-
blk.10.ffn_norm.weightF32[12288]
-
blk.11.attn_norm.weightF32[12288]
-
blk.11.ffn_down.weightI32[28672 12288]
-
blk.11.ffn_gate.weightI32[12288 28672]
-
blk.11.ffn_up.weightI32[12288 28672]
-
blk.11.ffn_norm.weightF32[12288]
-
blk.11.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.11.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.11.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.11.attn_v.weightQ4_K[12288 1024]
-
blk.12.attn_norm.weightF32[12288]
-
blk.12.ffn_down.weightI32[28672 12288]
-
blk.12.ffn_gate.weightI32[12288 28672]
-
blk.12.ffn_up.weightI32[12288 28672]
-
blk.12.ffn_norm.weightF32[12288]
-
blk.12.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.12.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.12.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.12.attn_v.weightQ4_K[12288 1024]
-
blk.13.ffn_gate.weightI32[12288 28672]
-
blk.13.ffn_up.weightI32[12288 28672]
-
blk.13.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.13.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.13.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.13.attn_v.weightQ4_K[12288 1024]
-
blk.13.attn_norm.weightF32[12288]
-
blk.13.ffn_down.weightI32[28672 12288]
-
blk.13.ffn_norm.weightF32[12288]
-
blk.14.attn_norm.weightF32[12288]
-
blk.14.ffn_down.weightI32[28672 12288]
-
blk.14.ffn_gate.weightI32[12288 28672]
-
blk.14.ffn_up.weightI32[12288 28672]
-
blk.14.ffn_norm.weightF32[12288]
-
blk.14.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.14.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.14.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.14.attn_v.weightQ4_K[12288 1024]
-
blk.15.ffn_gate.weightI32[12288 28672]
-
blk.15.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.15.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.15.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.15.attn_v.weightQ4_K[12288 1024]
-
blk.15.attn_norm.weightF32[12288]
-
blk.15.ffn_down.weightI32[28672 12288]
-
blk.15.ffn_up.weightI32[12288 28672]
-
blk.15.ffn_norm.weightF32[12288]
-
blk.16.attn_norm.weightF32[12288]
-
blk.16.ffn_down.weightI32[28672 12288]
-
blk.16.ffn_gate.weightI32[12288 28672]
-
blk.16.ffn_up.weightI32[12288 28672]
-
blk.16.ffn_norm.weightF32[12288]
-
blk.16.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.16.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.16.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.16.attn_v.weightQ4_K[12288 1024]
-
blk.17.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.17.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.17.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.17.attn_v.weightQ4_K[12288 1024]
-
blk.17.attn_norm.weightF32[12288]
-
blk.17.ffn_down.weightI32[28672 12288]
-
blk.17.ffn_gate.weightI32[12288 28672]
-
blk.17.ffn_up.weightI32[12288 28672]
-
blk.17.ffn_norm.weightF32[12288]
-
blk.18.attn_norm.weightF32[12288]
-
blk.18.ffn_down.weightI32[28672 12288]
-
blk.18.ffn_gate.weightI32[12288 28672]
-
blk.18.ffn_up.weightI32[12288 28672]
-
blk.18.ffn_norm.weightF32[12288]
-
blk.18.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.18.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.18.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.18.attn_v.weightQ4_K[12288 1024]
-
blk.19.attn_norm.weightF32[12288]
-
blk.19.ffn_down.weightI32[28672 12288]
-
blk.19.ffn_gate.weightI32[12288 28672]
-
blk.19.ffn_up.weightI32[12288 28672]
-
blk.19.ffn_norm.weightF32[12288]
-
blk.19.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.19.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.19.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.19.attn_v.weightQ4_K[12288 1024]
-
blk.20.ffn_gate.weightI32[12288 28672]
-
blk.20.ffn_up.weightI32[12288 28672]
-
blk.20.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.20.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.20.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.20.attn_v.weightQ4_K[12288 1024]
-
blk.20.attn_norm.weightF32[12288]
-
blk.20.ffn_down.weightI32[28672 12288]
-
blk.20.ffn_norm.weightF32[12288]
-
blk.21.attn_norm.weightF32[12288]
-
blk.21.ffn_down.weightI32[28672 12288]
-
blk.21.ffn_gate.weightI32[12288 28672]
-
blk.21.ffn_up.weightI32[12288 28672]
-
blk.21.ffn_norm.weightF32[12288]
-
blk.21.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.21.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.21.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.21.attn_v.weightQ4_K[12288 1024]
-
blk.22.ffn_gate.weightI32[12288 28672]
-
blk.22.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.22.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.22.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.22.attn_v.weightQ4_K[12288 1024]
-
blk.22.attn_norm.weightF32[12288]
-
blk.22.ffn_down.weightI32[28672 12288]
-
blk.22.ffn_up.weightI32[12288 28672]
-
blk.22.ffn_norm.weightF32[12288]
-
blk.23.attn_norm.weightF32[12288]
-
blk.23.ffn_down.weightI32[28672 12288]
-
blk.23.ffn_gate.weightI32[12288 28672]
-
blk.23.ffn_up.weightI32[12288 28672]
-
blk.23.ffn_norm.weightF32[12288]
-
blk.23.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.23.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.23.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.23.attn_v.weightQ4_K[12288 1024]
-
blk.24.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.24.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.24.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.24.attn_v.weightQ4_K[12288 1024]
-
blk.24.attn_norm.weightF32[12288]
-
blk.24.ffn_down.weightI32[28672 12288]
-
blk.24.ffn_gate.weightI32[12288 28672]
-
blk.24.ffn_up.weightI32[12288 28672]
-
blk.24.ffn_norm.weightF32[12288]
-
blk.25.attn_norm.weightF32[12288]
-
blk.25.ffn_down.weightI32[28672 12288]
-
blk.25.ffn_gate.weightI32[12288 28672]
-
blk.25.ffn_up.weightI32[12288 28672]
-
blk.25.ffn_norm.weightF32[12288]
-
blk.25.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.25.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.25.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.25.attn_v.weightQ4_K[12288 1024]
-
blk.26.attn_norm.weightF32[12288]
-
blk.26.ffn_down.weightI32[28672 12288]
-
blk.26.ffn_gate.weightI32[12288 28672]
-
blk.26.ffn_up.weightI32[12288 28672]
-
blk.26.ffn_norm.weightF32[12288]
-
blk.26.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.26.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.26.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.26.attn_v.weightQ4_K[12288 1024]
-
blk.27.ffn_gate.weightI32[12288 28672]
-
blk.27.ffn_up.weightI32[12288 28672]
-
blk.27.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.27.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.27.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.27.attn_v.weightQ4_K[12288 1024]
-
blk.27.attn_norm.weightF32[12288]
-
blk.27.ffn_down.weightI32[28672 12288]
-
blk.27.ffn_norm.weightF32[12288]
-
blk.28.attn_norm.weightF32[12288]
-
blk.28.ffn_down.weightI32[28672 12288]
-
blk.28.ffn_gate.weightI32[12288 28672]
-
blk.28.ffn_up.weightI32[12288 28672]
-
blk.28.ffn_norm.weightF32[12288]
-
blk.28.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.28.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.28.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.28.attn_v.weightQ4_K[12288 1024]
-
blk.29.ffn_gate.weightI32[12288 28672]
-
blk.29.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.29.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.29.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.29.attn_v.weightQ4_K[12288 1024]
-
blk.29.attn_norm.weightF32[12288]
-
blk.29.ffn_down.weightI32[28672 12288]
-
blk.29.ffn_up.weightI32[12288 28672]
-
blk.29.ffn_norm.weightF32[12288]
-
blk.30.attn_norm.weightF32[12288]
-
blk.30.ffn_down.weightI32[28672 12288]
-
blk.30.ffn_gate.weightI32[12288 28672]
-
blk.30.ffn_up.weightI32[12288 28672]
-
blk.30.ffn_norm.weightF32[12288]
-
blk.30.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.30.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.30.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.30.attn_v.weightQ4_K[12288 1024]
-
blk.31.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.31.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.31.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.31.attn_v.weightQ4_K[12288 1024]
-
blk.31.attn_norm.weightF32[12288]
-
blk.31.ffn_down.weightI32[28672 12288]
-
blk.31.ffn_gate.weightI32[12288 28672]
-
blk.31.ffn_up.weightI32[12288 28672]
-
blk.31.ffn_norm.weightF32[12288]
-
blk.32.attn_norm.weightF32[12288]
-
blk.32.ffn_down.weightI32[28672 12288]
-
blk.32.ffn_gate.weightI32[12288 28672]
-
blk.32.ffn_up.weightI32[12288 28672]
-
blk.32.ffn_norm.weightF32[12288]
-
blk.32.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.32.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.32.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.32.attn_v.weightQ4_K[12288 1024]
-
blk.33.attn_norm.weightF32[12288]
-
blk.33.ffn_down.weightI32[28672 12288]
-
blk.33.ffn_gate.weightI32[12288 28672]
-
blk.33.ffn_up.weightI32[12288 28672]
-
blk.33.ffn_norm.weightF32[12288]
-
blk.33.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.33.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.33.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.33.attn_v.weightQ4_K[12288 1024]
-
blk.34.ffn_gate.weightI32[12288 28672]
-
blk.34.ffn_up.weightI32[12288 28672]
-
blk.34.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.34.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.34.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.34.attn_v.weightQ4_K[12288 1024]
-
blk.34.attn_norm.weightF32[12288]
-
blk.34.ffn_down.weightI32[28672 12288]
-
blk.34.ffn_norm.weightF32[12288]
-
blk.35.attn_norm.weightF32[12288]
-
blk.35.ffn_down.weightI32[28672 12288]
-
blk.35.ffn_gate.weightI32[12288 28672]
-
blk.35.ffn_up.weightI32[12288 28672]
-
blk.35.ffn_norm.weightF32[12288]
-
blk.35.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.35.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.35.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.35.attn_v.weightQ4_K[12288 1024]
-
blk.36.ffn_gate.weightI32[12288 28672]
-
blk.36.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.36.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.36.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.36.attn_v.weightQ4_K[12288 1024]
-
blk.36.attn_norm.weightF32[12288]
-
blk.36.ffn_down.weightI32[28672 12288]
-
blk.36.ffn_up.weightI32[12288 28672]
-
blk.36.ffn_norm.weightF32[12288]
-
blk.37.attn_norm.weightF32[12288]
-
blk.37.ffn_down.weightI32[28672 12288]
-
blk.37.ffn_gate.weightI32[12288 28672]
-
blk.37.ffn_up.weightI32[12288 28672]
-
blk.37.ffn_norm.weightF32[12288]
-
blk.37.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.37.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.37.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.37.attn_v.weightQ4_K[12288 1024]
-
blk.38.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.38.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.38.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.38.attn_v.weightQ4_K[12288 1024]
-
blk.38.attn_norm.weightF32[12288]
-
blk.38.ffn_down.weightI32[28672 12288]
-
blk.38.ffn_gate.weightI32[12288 28672]
-
blk.38.ffn_up.weightI32[12288 28672]
-
blk.38.ffn_norm.weightF32[12288]
-
blk.39.attn_norm.weightF32[12288]
-
blk.39.ffn_down.weightI32[28672 12288]
-
blk.39.ffn_gate.weightI32[12288 28672]
-
blk.39.ffn_up.weightI32[12288 28672]
-
blk.39.ffn_norm.weightF32[12288]
-
blk.39.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.39.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.39.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.39.attn_v.weightQ4_K[12288 1024]
-
blk.40.attn_norm.weightF32[12288]
-
blk.40.ffn_down.weightI32[28672 12288]
-
blk.40.ffn_gate.weightI32[12288 28672]
-
blk.40.ffn_up.weightI32[12288 28672]
-
blk.40.ffn_norm.weightF32[12288]
-
blk.40.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.40.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.40.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.40.attn_v.weightQ4_K[12288 1024]
-
blk.41.ffn_gate.weightI32[12288 28672]
-
blk.41.ffn_up.weightI32[12288 28672]
-
blk.41.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.41.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.41.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.41.attn_v.weightQ4_K[12288 1024]
-
blk.41.attn_norm.weightF32[12288]
-
blk.41.ffn_down.weightI32[28672 12288]
-
blk.41.ffn_norm.weightF32[12288]
-
blk.42.attn_norm.weightF32[12288]
-
blk.42.ffn_down.weightI32[28672 12288]
-
blk.42.ffn_gate.weightI32[12288 28672]
-
blk.42.ffn_up.weightI32[12288 28672]
-
blk.42.ffn_norm.weightF32[12288]
-
blk.42.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.42.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.42.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.42.attn_v.weightQ4_K[12288 1024]
-
blk.43.ffn_gate.weightI32[12288 28672]
-
blk.43.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.43.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.43.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.43.attn_v.weightQ4_K[12288 1024]
-
blk.43.attn_norm.weightF32[12288]
-
blk.43.ffn_down.weightI32[28672 12288]
-
blk.43.ffn_up.weightI32[12288 28672]
-
blk.43.ffn_norm.weightF32[12288]
-
blk.44.attn_norm.weightF32[12288]
-
blk.44.ffn_down.weightI32[28672 12288]
-
blk.44.ffn_gate.weightI32[12288 28672]
-
blk.44.ffn_up.weightI32[12288 28672]
-
blk.44.ffn_norm.weightF32[12288]
-
blk.44.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.44.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.44.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.44.attn_v.weightQ4_K[12288 1024]
-
blk.45.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.45.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.45.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.45.attn_v.weightQ4_K[12288 1024]
-
blk.45.attn_norm.weightF32[12288]
-
blk.45.ffn_down.weightI32[28672 12288]
-
blk.45.ffn_gate.weightI32[12288 28672]
-
blk.45.ffn_up.weightI32[12288 28672]
-
blk.45.ffn_norm.weightF32[12288]
-
blk.46.attn_norm.weightF32[12288]
-
blk.46.ffn_down.weightI32[28672 12288]
-
blk.46.ffn_gate.weightI32[12288 28672]
-
blk.46.ffn_up.weightI32[12288 28672]
-
blk.46.ffn_norm.weightF32[12288]
-
blk.46.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.46.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.46.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.46.attn_v.weightQ4_K[12288 1024]
-
blk.47.attn_norm.weightF32[12288]
-
blk.47.ffn_down.weightI32[28672 12288]
-
blk.47.ffn_gate.weightI32[12288 28672]
-
blk.47.ffn_up.weightI32[12288 28672]
-
blk.47.ffn_norm.weightF32[12288]
-
blk.47.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.47.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.47.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.47.attn_v.weightQ4_K[12288 1024]
-
blk.48.ffn_gate.weightI32[12288 28672]
-
blk.48.ffn_up.weightI32[12288 28672]
-
blk.48.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.48.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.48.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.48.attn_v.weightQ4_K[12288 1024]
-
blk.48.attn_norm.weightF32[12288]
-
blk.48.ffn_down.weightI32[28672 12288]
-
blk.48.ffn_norm.weightF32[12288]
-
blk.49.attn_norm.weightF32[12288]
-
blk.49.ffn_down.weightI32[28672 12288]
-
blk.49.ffn_gate.weightI32[12288 28672]
-
blk.49.ffn_up.weightI32[12288 28672]
-
blk.49.ffn_norm.weightF32[12288]
-
blk.49.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.49.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.49.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.49.attn_v.weightQ4_K[12288 1024]
-
blk.50.ffn_gate.weightI32[12288 28672]
-
blk.50.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.50.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.50.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.50.attn_v.weightQ4_K[12288 1024]
-
blk.50.attn_norm.weightF32[12288]
-
blk.50.ffn_down.weightI32[28672 12288]
-
blk.50.ffn_up.weightI32[12288 28672]
-
blk.50.ffn_norm.weightF32[12288]
-
blk.51.attn_norm.weightF32[12288]
-
blk.51.ffn_down.weightI32[28672 12288]
-
blk.51.ffn_gate.weightI32[12288 28672]
-
blk.51.ffn_up.weightI32[12288 28672]
-
blk.51.ffn_norm.weightF32[12288]
-
blk.51.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.51.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.51.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.51.attn_v.weightQ4_K[12288 1024]
-
blk.52.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.52.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.52.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.52.attn_v.weightQ4_K[12288 1024]
-
blk.52.attn_norm.weightF32[12288]
-
blk.52.ffn_down.weightI32[28672 12288]
-
blk.52.ffn_gate.weightI32[12288 28672]
-
blk.52.ffn_up.weightI32[12288 28672]
-
blk.52.ffn_norm.weightF32[12288]
-
blk.53.attn_norm.weightF32[12288]
-
blk.53.ffn_down.weightI32[28672 12288]
-
blk.53.ffn_gate.weightI32[12288 28672]
-
blk.53.ffn_up.weightI32[12288 28672]
-
blk.53.ffn_norm.weightF32[12288]
-
blk.53.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.53.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.53.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.53.attn_v.weightQ4_K[12288 1024]
-
blk.54.attn_norm.weightF32[12288]
-
blk.54.ffn_down.weightI32[28672 12288]
-
blk.54.ffn_gate.weightI32[12288 28672]
-
blk.54.ffn_up.weightI32[12288 28672]
-
blk.54.ffn_norm.weightF32[12288]
-
blk.54.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.54.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.54.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.54.attn_v.weightQ4_K[12288 1024]
-
blk.55.ffn_gate.weightI32[12288 28672]
-
blk.55.ffn_up.weightI32[12288 28672]
-
blk.55.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.55.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.55.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.55.attn_v.weightQ4_K[12288 1024]
-
blk.55.attn_norm.weightF32[12288]
-
blk.55.ffn_down.weightI32[28672 12288]
-
blk.55.ffn_norm.weightF32[12288]
-
blk.56.attn_norm.weightF32[12288]
-
blk.56.ffn_down.weightI32[28672 12288]
-
blk.56.ffn_gate.weightI32[12288 28672]
-
blk.56.ffn_up.weightI32[12288 28672]
-
blk.56.ffn_norm.weightF32[12288]
-
blk.56.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.56.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.56.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.56.attn_v.weightQ4_K[12288 1024]
-
blk.57.ffn_gate.weightI32[12288 28672]
-
blk.57.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.57.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.57.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.57.attn_v.weightQ4_K[12288 1024]
-
blk.57.attn_norm.weightF32[12288]
-
blk.57.ffn_down.weightI32[28672 12288]
-
blk.57.ffn_up.weightI32[12288 28672]
-
blk.57.ffn_norm.weightF32[12288]
-
blk.58.attn_norm.weightF32[12288]
-
blk.58.ffn_down.weightI32[28672 12288]
-
blk.58.ffn_gate.weightI32[12288 28672]
-
blk.58.ffn_up.weightI32[12288 28672]
-
blk.58.ffn_norm.weightF32[12288]
-
blk.58.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.58.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.58.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.58.attn_v.weightQ4_K[12288 1024]
-
blk.59.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.59.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.59.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.59.attn_v.weightQ4_K[12288 1024]
-
blk.59.attn_norm.weightF32[12288]
-
blk.59.ffn_down.weightI32[28672 12288]
-
blk.59.ffn_gate.weightI32[12288 28672]
-
blk.59.ffn_up.weightI32[12288 28672]
-
blk.59.ffn_norm.weightF32[12288]
-
blk.60.attn_norm.weightF32[12288]
-
blk.60.ffn_down.weightI32[28672 12288]
-
blk.60.ffn_gate.weightI32[12288 28672]
-
blk.60.ffn_up.weightI32[12288 28672]
-
blk.60.ffn_norm.weightF32[12288]
-
blk.60.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.60.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.60.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.60.attn_v.weightQ4_K[12288 1024]
-
blk.61.attn_norm.weightF32[12288]
-
blk.61.ffn_down.weightI32[28672 12288]
-
blk.61.ffn_gate.weightI32[12288 28672]
-
blk.61.ffn_up.weightI32[12288 28672]
-
blk.61.ffn_norm.weightF32[12288]
-
blk.61.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.61.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.61.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.61.attn_v.weightQ4_K[12288 1024]
-
blk.62.ffn_gate.weightI32[12288 28672]
-
blk.62.ffn_up.weightI32[12288 28672]
-
blk.62.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.62.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.62.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.62.attn_v.weightQ4_K[12288 1024]
-
blk.62.attn_norm.weightF32[12288]
-
blk.62.ffn_down.weightI32[28672 12288]
-
blk.62.ffn_norm.weightF32[12288]
-
blk.63.attn_norm.weightF32[12288]
-
blk.63.ffn_down.weightI32[28672 12288]
-
blk.63.ffn_gate.weightI32[12288 28672]
-
blk.63.ffn_up.weightI32[12288 28672]
-
blk.63.ffn_norm.weightF32[12288]
-
blk.63.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.63.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.63.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.63.attn_v.weightQ4_K[12288 1024]
-
blk.64.ffn_gate.weightI32[12288 28672]
-
blk.64.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.64.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.64.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.64.attn_v.weightQ4_K[12288 1024]
-
blk.64.attn_norm.weightF32[12288]
-
blk.64.ffn_down.weightI32[28672 12288]
-
blk.64.ffn_up.weightI32[12288 28672]
-
blk.64.ffn_norm.weightF32[12288]
-
blk.65.attn_norm.weightF32[12288]
-
blk.65.ffn_down.weightI32[28672 12288]
-
blk.65.ffn_gate.weightI32[12288 28672]
-
blk.65.ffn_up.weightI32[12288 28672]
-
blk.65.ffn_norm.weightF32[12288]
-
blk.65.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.65.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.65.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.65.attn_v.weightQ4_K[12288 1024]
-
blk.66.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.66.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.66.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.66.attn_v.weightQ4_K[12288 1024]
-
blk.66.attn_norm.weightF32[12288]
-
blk.66.ffn_down.weightI32[28672 12288]
-
blk.66.ffn_gate.weightI32[12288 28672]
-
blk.66.ffn_up.weightI32[12288 28672]
-
blk.66.ffn_norm.weightF32[12288]
-
blk.67.attn_norm.weightF32[12288]
-
blk.67.ffn_down.weightI32[28672 12288]
-
blk.67.ffn_gate.weightI32[12288 28672]
-
blk.67.ffn_up.weightI32[12288 28672]
-
blk.67.ffn_norm.weightF32[12288]
-
blk.67.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.67.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.67.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.67.attn_v.weightQ4_K[12288 1024]
-
blk.68.attn_norm.weightF32[12288]
-
blk.68.ffn_down.weightI32[28672 12288]
-
blk.68.ffn_gate.weightI32[12288 28672]
-
blk.68.ffn_up.weightI32[12288 28672]
-
blk.68.ffn_norm.weightF32[12288]
-
blk.68.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.68.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.68.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.68.attn_v.weightQ4_K[12288 1024]
-
blk.69.ffn_gate.weightI32[12288 28672]
-
blk.69.ffn_up.weightI32[12288 28672]
-
blk.69.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.69.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.69.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.69.attn_v.weightQ4_K[12288 1024]
-
blk.69.attn_norm.weightF32[12288]
-
blk.69.ffn_down.weightI32[28672 12288]
-
blk.69.ffn_norm.weightF32[12288]
-
blk.70.attn_norm.weightF32[12288]
-
blk.70.ffn_down.weightI32[28672 12288]
-
blk.70.ffn_gate.weightI32[12288 28672]
-
blk.70.ffn_up.weightI32[12288 28672]
-
blk.70.ffn_norm.weightF32[12288]
-
blk.70.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.70.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.70.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.70.attn_v.weightQ4_K[12288 1024]
-
blk.71.ffn_gate.weightI32[12288 28672]
-
blk.71.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.71.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.71.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.71.attn_v.weightQ4_K[12288 1024]
-
blk.71.attn_norm.weightF32[12288]
-
blk.71.ffn_down.weightI32[28672 12288]
-
blk.71.ffn_up.weightI32[12288 28672]
-
blk.71.ffn_norm.weightF32[12288]
-
blk.72.attn_norm.weightF32[12288]
-
blk.72.ffn_down.weightI32[28672 12288]
-
blk.72.ffn_gate.weightI32[12288 28672]
-
blk.72.ffn_up.weightI32[12288 28672]
-
blk.72.ffn_norm.weightF32[12288]
-
blk.72.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.72.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.72.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.72.attn_v.weightQ4_K[12288 1024]
-
blk.73.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.73.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.73.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.73.attn_v.weightQ4_K[12288 1024]
-
blk.73.attn_norm.weightF32[12288]
-
blk.73.ffn_down.weightI32[28672 12288]
-
blk.73.ffn_gate.weightI32[12288 28672]
-
blk.73.ffn_up.weightI32[12288 28672]
-
blk.73.ffn_norm.weightF32[12288]
-
blk.74.attn_norm.weightF32[12288]
-
blk.74.ffn_down.weightI32[28672 12288]
-
blk.74.ffn_gate.weightI32[12288 28672]
-
blk.74.ffn_up.weightI32[12288 28672]
-
blk.74.ffn_norm.weightF32[12288]
-
blk.74.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.74.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.74.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.74.attn_v.weightQ4_K[12288 1024]
-
blk.75.attn_norm.weightF32[12288]
-
blk.75.ffn_down.weightI32[28672 12288]
-
blk.75.ffn_gate.weightI32[12288 28672]
-
blk.75.ffn_up.weightI32[12288 28672]
-
blk.75.ffn_norm.weightF32[12288]
-
blk.75.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.75.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.75.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.75.attn_v.weightQ4_K[12288 1024]
-
blk.76.ffn_gate.weightI32[12288 28672]
-
blk.76.ffn_up.weightI32[12288 28672]
-
blk.76.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.76.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.76.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.76.attn_v.weightQ4_K[12288 1024]
-
blk.76.attn_norm.weightF32[12288]
-
blk.76.ffn_down.weightI32[28672 12288]
-
blk.76.ffn_norm.weightF32[12288]
-
blk.77.attn_norm.weightF32[12288]
-
blk.77.ffn_down.weightI32[28672 12288]
-
blk.77.ffn_gate.weightI32[12288 28672]
-
blk.77.ffn_up.weightI32[12288 28672]
-
blk.77.ffn_norm.weightF32[12288]
-
blk.77.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.77.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.77.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.77.attn_v.weightQ4_K[12288 1024]
-
blk.78.ffn_gate.weightI32[12288 28672]
-
blk.78.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.78.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.78.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.78.attn_v.weightQ4_K[12288 1024]
-
blk.78.attn_norm.weightF32[12288]
-
blk.78.ffn_down.weightI32[28672 12288]
-
blk.78.ffn_up.weightI32[12288 28672]
-
blk.78.ffn_norm.weightF32[12288]
-
blk.79.attn_norm.weightF32[12288]
-
blk.79.ffn_down.weightI32[28672 12288]
-
blk.79.ffn_gate.weightI32[12288 28672]
-
blk.79.ffn_up.weightI32[12288 28672]
-
blk.79.ffn_norm.weightF32[12288]
-
blk.79.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.79.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.79.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.79.attn_v.weightQ4_K[12288 1024]
-
blk.80.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.80.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.80.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.80.attn_v.weightQ4_K[12288 1024]
-
blk.80.attn_norm.weightF32[12288]
-
blk.80.ffn_down.weightI32[28672 12288]
-
blk.80.ffn_gate.weightI32[12288 28672]
-
blk.80.ffn_up.weightI32[12288 28672]
-
blk.80.ffn_norm.weightF32[12288]
-
blk.81.attn_norm.weightF32[12288]
-
blk.81.ffn_down.weightI32[28672 12288]
-
blk.81.ffn_gate.weightI32[12288 28672]
-
blk.81.ffn_up.weightI32[12288 28672]
-
blk.81.ffn_norm.weightF32[12288]
-
blk.81.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.81.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.81.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.81.attn_v.weightQ4_K[12288 1024]
-
blk.82.attn_norm.weightF32[12288]
-
blk.82.ffn_down.weightI32[28672 12288]
-
blk.82.ffn_gate.weightI32[12288 28672]
-
blk.82.ffn_up.weightI32[12288 28672]
-
blk.82.ffn_norm.weightF32[12288]
-
blk.82.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.82.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.82.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.82.attn_v.weightQ4_K[12288 1024]
-
blk.83.ffn_gate.weightI32[12288 28672]
-
blk.83.ffn_up.weightI32[12288 28672]
-
blk.83.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.83.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.83.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.83.attn_v.weightQ4_K[12288 1024]
-
blk.83.attn_norm.weightF32[12288]
-
blk.83.ffn_down.weightI32[28672 12288]
-
blk.83.ffn_norm.weightF32[12288]
-
blk.84.attn_norm.weightF32[12288]
-
blk.84.ffn_down.weightI32[28672 12288]
-
blk.84.ffn_gate.weightI32[12288 28672]
-
blk.84.ffn_up.weightI32[12288 28672]
-
blk.84.ffn_norm.weightF32[12288]
-
blk.84.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.84.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.84.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.84.attn_v.weightQ4_K[12288 1024]
-
blk.85.ffn_gate.weightI32[12288 28672]
-
blk.85.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.85.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.85.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.85.attn_v.weightQ4_K[12288 1024]
-
blk.85.attn_norm.weightF32[12288]
-
blk.85.ffn_down.weightI32[28672 12288]
-
blk.85.ffn_up.weightI32[12288 28672]
-
blk.85.ffn_norm.weightF32[12288]
-
blk.86.attn_norm.weightF32[12288]
-
blk.86.ffn_down.weightI32[28672 12288]
-
blk.86.ffn_gate.weightI32[12288 28672]
-
blk.86.ffn_up.weightI32[12288 28672]
-
blk.86.ffn_norm.weightF32[12288]
-
blk.86.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.86.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.86.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.86.attn_v.weightQ4_K[12288 1024]
-
blk.87.attn_k.weight(!unknown_type 22!)[12288 1024]
-
blk.87.attn_output.weight(!unknown_type 21!)[12288 12288]
-
blk.87.attn_q.weight(!unknown_type 22!)[12288 12288]
-
blk.87.attn_v.weightQ4_K[12288 1024]
-
blk.87.attn_norm.weightF32[12288]
-
blk.87.ffn_down.weightI32[28672 12288]
-
blk.87.ffn_gate.weightI32[12288 28672]
-
blk.87.ffn_up.weightI32[12288 28672]
-
blk.87.ffn_norm.weightF32[12288]
-
output.weightQ5_K[12288 32768]
-
output_norm.weightF32[12288]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79
blk.80
blk.81
blk.82
blk.83
blk.84
blk.85
blk.86
blk.87