Models
Docs
Pricing
Sign in
Download
Models
Download
Docs
Pricing
Sign in
SetneufPT
/
Qwen3.6-27B-MTP_Q3_32K_16GB-GPU
:latest
743
Downloads
Updated
1 week ago
Custom model for coding with agents to use locally with 16gb GPUs (working fine...)
Custom model for coding with agents to use locally with 16gb GPUs (working fine...)
Cancel
Qwen3.6-27B-MTP_Q3_32K_16GB-GPU:latest
...
/
model
8624c775deed · 14GB
Metadata
general.architecture
qwen35
qwen35
general.file_type
Q3_K_M
Q3_K_M
qwen35.attention.head_count
24
24
qwen35.attention.head_count_kv
4
4
qwen35.attention.key_length
256
256
qwen35.attention.layer_norm_rms_epsilon
1e-06
1e-06
qwen35.attention.value_length
256
256
qwen35.block_count
65
65
qwen35.context_length
262144
262144
qwen35.embedding_length
5120
5120
qwen35.feed_forward_length
17408
17408
qwen35.full_attention_interval
4
4
qwen35.nextn_predict_layers
1
1
qwen35.rope.dimension_count
64
64
qwen35.rope.dimension_sections
[11, 11, 10, 0]
[11, 11, 10, 0]
qwen35.rope.freq_base
1e+07
1e+07
qwen35.ssm.conv_kernel
4
4
qwen35.ssm.group_count
16
16
qwen35.ssm.inner_size
6144
6144
qwen35.ssm.state_size
128
128
qwen35.ssm.time_step_rank
48
48
tokenizer.ggml.add_bos_token
false
false
tokenizer.ggml.bos_token_id
248044
248044
tokenizer.ggml.eos_token_id
248046
248046
tokenizer.ggml.merges
[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
tokenizer.ggml.model
gpt2
gpt2
tokenizer.ggml.padding_token_id
248055
248055
tokenizer.ggml.pre
qwen35
qwen35
tokenizer.ggml.token_type
[1, 1, 1, 1, 1, ...]
[1, 1, 1, 1, 1, ...]
tokenizer.ggml.tokens
[!, ", #, $, %, ...]
[!, ", #, $, %, ...]
quantize.imatrix.chunks_count
76
76
quantize.imatrix.dataset
unsloth_calibration_Qwen3.6-27B.txt
unsloth_calibration_Qwen3.6-27B.txt
quantize.imatrix.entries_count
496
496
quantize.imatrix.file
Qwen3.6-27B-GGUF/imatrix_unsloth.gguf
Qwen3.6-27B-GGUF/imatrix_unsloth.gguf
Tensor
Name
Type
Shape
token_embd.weight
Q3_K
Q3_K
[5120, 248320]
blk.0
blk.0.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.0.attn_norm.weight
F32
F32
[5120]
blk.0.attn_qkv.weight
Q5_K
Q5_K
[5120, 10240]
blk.0.ffn_down.weight
Q5_K
Q5_K
[17408, 5120]
blk.0.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.0.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.0.post_attention_norm.weight
F32
F32
[5120]
blk.0.ssm_a
F32
F32
[48]
blk.0.ssm_alpha.weight
F32
F32
[5120, 48]
blk.0.ssm_beta.weight
F32
F32
[5120, 48]
blk.0.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.0.ssm_dt.bias
F32
F32
[48]
blk.0.ssm_norm.weight
F32
F32
[128]
blk.0.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.1
blk.1.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.1.attn_norm.weight
F32
F32
[5120]
blk.1.attn_qkv.weight
Q5_K
Q5_K
[5120, 10240]
blk.1.ffn_down.weight
Q5_K
Q5_K
[17408, 5120]
blk.1.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.1.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.1.post_attention_norm.weight
F32
F32
[5120]
blk.1.ssm_a
F32
F32
[48]
blk.1.ssm_alpha.weight
F32
F32
[5120, 48]
blk.1.ssm_beta.weight
F32
F32
[5120, 48]
blk.1.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.1.ssm_dt.bias
F32
F32
[48]
blk.1.ssm_norm.weight
F32
F32
[128]
blk.1.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.2
blk.2.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.2.attn_norm.weight
F32
F32
[5120]
blk.2.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.2.ffn_down.weight
Q5_K
Q5_K
[17408, 5120]
blk.2.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.2.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.2.post_attention_norm.weight
F32
F32
[5120]
blk.2.ssm_a
F32
F32
[48]
blk.2.ssm_alpha.weight
F32
F32
[5120, 48]
blk.2.ssm_beta.weight
F32
F32
[5120, 48]
blk.2.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.2.ssm_dt.bias
F32
F32
[48]
blk.2.ssm_norm.weight
F32
F32
[128]
blk.2.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.3
blk.3.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.3.attn_k_norm.weight
F32
F32
[256]
blk.3.attn_norm.weight
F32
F32
[5120]
blk.3.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.3.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.3.attn_q_norm.weight
F32
F32
[256]
blk.3.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.3.ffn_down.weight
Q5_K
Q5_K
[17408, 5120]
blk.3.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.3.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.3.post_attention_norm.weight
F32
F32
[5120]
blk.4
blk.4.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.4.attn_norm.weight
F32
F32
[5120]
blk.4.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.4.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.4.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.4.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.4.post_attention_norm.weight
F32
F32
[5120]
blk.4.ssm_a
F32
F32
[48]
blk.4.ssm_alpha.weight
F32
F32
[5120, 48]
blk.4.ssm_beta.weight
F32
F32
[5120, 48]
blk.4.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.4.ssm_dt.bias
F32
F32
[48]
blk.4.ssm_norm.weight
F32
F32
[128]
blk.4.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.5
blk.5.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.5.attn_norm.weight
F32
F32
[5120]
blk.5.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.5.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.5.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.5.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.5.post_attention_norm.weight
F32
F32
[5120]
blk.5.ssm_a
F32
F32
[48]
blk.5.ssm_alpha.weight
F32
F32
[5120, 48]
blk.5.ssm_beta.weight
F32
F32
[5120, 48]
blk.5.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.5.ssm_dt.bias
F32
F32
[48]
blk.5.ssm_norm.weight
F32
F32
[128]
blk.5.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.6
blk.6.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.6.attn_norm.weight
F32
F32
[5120]
blk.6.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.6.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.6.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.6.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.6.post_attention_norm.weight
F32
F32
[5120]
blk.6.ssm_a
F32
F32
[48]
blk.6.ssm_alpha.weight
F32
F32
[5120, 48]
blk.6.ssm_beta.weight
F32
F32
[5120, 48]
blk.6.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.6.ssm_dt.bias
F32
F32
[48]
blk.6.ssm_norm.weight
F32
F32
[128]
blk.6.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.7
blk.7.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.7.attn_k_norm.weight
F32
F32
[256]
blk.7.attn_norm.weight
F32
F32
[5120]
blk.7.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.7.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.7.attn_q_norm.weight
F32
F32
[256]
blk.7.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.7.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.7.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.7.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.7.post_attention_norm.weight
F32
F32
[5120]
blk.8
blk.8.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.8.attn_norm.weight
F32
F32
[5120]
blk.8.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.8.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.8.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.8.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.8.post_attention_norm.weight
F32
F32
[5120]
blk.8.ssm_a
F32
F32
[48]
blk.8.ssm_alpha.weight
F32
F32
[5120, 48]
blk.8.ssm_beta.weight
F32
F32
[5120, 48]
blk.8.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.8.ssm_dt.bias
F32
F32
[48]
blk.8.ssm_norm.weight
F32
F32
[128]
blk.8.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.9
blk.9.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.9.attn_norm.weight
F32
F32
[5120]
blk.9.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.9.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.9.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.9.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.9.post_attention_norm.weight
F32
F32
[5120]
blk.9.ssm_a
F32
F32
[48]
blk.9.ssm_alpha.weight
F32
F32
[5120, 48]
blk.9.ssm_beta.weight
F32
F32
[5120, 48]
blk.9.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.9.ssm_dt.bias
F32
F32
[48]
blk.9.ssm_norm.weight
F32
F32
[128]
blk.9.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.10
blk.10.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.10.attn_norm.weight
F32
F32
[5120]
blk.10.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.10.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.10.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.10.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.10.post_attention_norm.weight
F32
F32
[5120]
blk.10.ssm_a
F32
F32
[48]
blk.10.ssm_alpha.weight
F32
F32
[5120, 48]
blk.10.ssm_beta.weight
F32
F32
[5120, 48]
blk.10.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.10.ssm_dt.bias
F32
F32
[48]
blk.10.ssm_norm.weight
F32
F32
[128]
blk.10.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.11
blk.11.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.11.attn_k_norm.weight
F32
F32
[256]
blk.11.attn_norm.weight
F32
F32
[5120]
blk.11.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.11.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.11.attn_q_norm.weight
F32
F32
[256]
blk.11.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.11.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.11.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.11.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.11.post_attention_norm.weight
F32
F32
[5120]
blk.12
blk.12.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.12.attn_norm.weight
F32
F32
[5120]
blk.12.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.12.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.12.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.12.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.12.post_attention_norm.weight
F32
F32
[5120]
blk.12.ssm_a
F32
F32
[48]
blk.12.ssm_alpha.weight
F32
F32
[5120, 48]
blk.12.ssm_beta.weight
F32
F32
[5120, 48]
blk.12.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.12.ssm_dt.bias
F32
F32
[48]
blk.12.ssm_norm.weight
F32
F32
[128]
blk.12.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.13
blk.13.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.13.attn_norm.weight
F32
F32
[5120]
blk.13.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.13.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.13.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.13.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.13.post_attention_norm.weight
F32
F32
[5120]
blk.13.ssm_a
F32
F32
[48]
blk.13.ssm_alpha.weight
F32
F32
[5120, 48]
blk.13.ssm_beta.weight
F32
F32
[5120, 48]
blk.13.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.13.ssm_dt.bias
F32
F32
[48]
blk.13.ssm_norm.weight
F32
F32
[128]
blk.13.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.14
blk.14.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.14.attn_norm.weight
F32
F32
[5120]
blk.14.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.14.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.14.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.14.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.14.post_attention_norm.weight
F32
F32
[5120]
blk.14.ssm_a
F32
F32
[48]
blk.14.ssm_alpha.weight
F32
F32
[5120, 48]
blk.14.ssm_beta.weight
F32
F32
[5120, 48]
blk.14.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.14.ssm_dt.bias
F32
F32
[48]
blk.14.ssm_norm.weight
F32
F32
[128]
blk.14.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.15
blk.15.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.15.attn_k_norm.weight
F32
F32
[256]
blk.15.attn_norm.weight
F32
F32
[5120]
blk.15.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.15.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.15.attn_q_norm.weight
F32
F32
[256]
blk.15.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.15.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.15.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.15.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.15.post_attention_norm.weight
F32
F32
[5120]
blk.16
blk.16.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.16.attn_norm.weight
F32
F32
[5120]
blk.16.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.16.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.16.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.16.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.16.post_attention_norm.weight
F32
F32
[5120]
blk.16.ssm_a
F32
F32
[48]
blk.16.ssm_alpha.weight
F32
F32
[5120, 48]
blk.16.ssm_beta.weight
F32
F32
[5120, 48]
blk.16.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.16.ssm_dt.bias
F32
F32
[48]
blk.16.ssm_norm.weight
F32
F32
[128]
blk.16.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.17
blk.17.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.17.attn_norm.weight
F32
F32
[5120]
blk.17.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.17.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.17.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.17.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.17.post_attention_norm.weight
F32
F32
[5120]
blk.17.ssm_a
F32
F32
[48]
blk.17.ssm_alpha.weight
F32
F32
[5120, 48]
blk.17.ssm_beta.weight
F32
F32
[5120, 48]
blk.17.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.17.ssm_dt.bias
F32
F32
[48]
blk.17.ssm_norm.weight
F32
F32
[128]
blk.17.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.18
blk.18.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.18.attn_norm.weight
F32
F32
[5120]
blk.18.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.18.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.18.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.18.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.18.post_attention_norm.weight
F32
F32
[5120]
blk.18.ssm_a
F32
F32
[48]
blk.18.ssm_alpha.weight
F32
F32
[5120, 48]
blk.18.ssm_beta.weight
F32
F32
[5120, 48]
blk.18.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.18.ssm_dt.bias
F32
F32
[48]
blk.18.ssm_norm.weight
F32
F32
[128]
blk.18.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.19
blk.19.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.19.attn_k_norm.weight
F32
F32
[256]
blk.19.attn_norm.weight
F32
F32
[5120]
blk.19.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.19.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.19.attn_q_norm.weight
F32
F32
[256]
blk.19.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.19.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.19.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.19.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.19.post_attention_norm.weight
F32
F32
[5120]
blk.20
blk.20.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.20.attn_norm.weight
F32
F32
[5120]
blk.20.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.20.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.20.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.20.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.20.post_attention_norm.weight
F32
F32
[5120]
blk.20.ssm_a
F32
F32
[48]
blk.20.ssm_alpha.weight
F32
F32
[5120, 48]
blk.20.ssm_beta.weight
F32
F32
[5120, 48]
blk.20.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.20.ssm_dt.bias
F32
F32
[48]
blk.20.ssm_norm.weight
F32
F32
[128]
blk.20.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.21
blk.21.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.21.attn_norm.weight
F32
F32
[5120]
blk.21.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.21.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.21.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.21.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.21.post_attention_norm.weight
F32
F32
[5120]
blk.21.ssm_a
F32
F32
[48]
blk.21.ssm_alpha.weight
F32
F32
[5120, 48]
blk.21.ssm_beta.weight
F32
F32
[5120, 48]
blk.21.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.21.ssm_dt.bias
F32
F32
[48]
blk.21.ssm_norm.weight
F32
F32
[128]
blk.21.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.22
blk.22.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.22.attn_norm.weight
F32
F32
[5120]
blk.22.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.22.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.22.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.22.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.22.post_attention_norm.weight
F32
F32
[5120]
blk.22.ssm_a
F32
F32
[48]
blk.22.ssm_alpha.weight
F32
F32
[5120, 48]
blk.22.ssm_beta.weight
F32
F32
[5120, 48]
blk.22.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.22.ssm_dt.bias
F32
F32
[48]
blk.22.ssm_norm.weight
F32
F32
[128]
blk.22.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.23
blk.23.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.23.attn_k_norm.weight
F32
F32
[256]
blk.23.attn_norm.weight
F32
F32
[5120]
blk.23.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.23.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.23.attn_q_norm.weight
F32
F32
[256]
blk.23.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.23.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.23.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.23.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.23.post_attention_norm.weight
F32
F32
[5120]
blk.24
blk.24.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.24.attn_norm.weight
F32
F32
[5120]
blk.24.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.24.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.24.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.24.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.24.post_attention_norm.weight
F32
F32
[5120]
blk.24.ssm_a
F32
F32
[48]
blk.24.ssm_alpha.weight
F32
F32
[5120, 48]
blk.24.ssm_beta.weight
F32
F32
[5120, 48]
blk.24.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.24.ssm_dt.bias
F32
F32
[48]
blk.24.ssm_norm.weight
F32
F32
[128]
blk.24.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.25
blk.25.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.25.attn_norm.weight
F32
F32
[5120]
blk.25.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.25.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.25.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.25.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.25.post_attention_norm.weight
F32
F32
[5120]
blk.25.ssm_a
F32
F32
[48]
blk.25.ssm_alpha.weight
F32
F32
[5120, 48]
blk.25.ssm_beta.weight
F32
F32
[5120, 48]
blk.25.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.25.ssm_dt.bias
F32
F32
[48]
blk.25.ssm_norm.weight
F32
F32
[128]
blk.25.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.26
blk.26.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.26.attn_norm.weight
F32
F32
[5120]
blk.26.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.26.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.26.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.26.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.26.post_attention_norm.weight
F32
F32
[5120]
blk.26.ssm_a
F32
F32
[48]
blk.26.ssm_alpha.weight
F32
F32
[5120, 48]
blk.26.ssm_beta.weight
F32
F32
[5120, 48]
blk.26.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.26.ssm_dt.bias
F32
F32
[48]
blk.26.ssm_norm.weight
F32
F32
[128]
blk.26.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.27
blk.27.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.27.attn_k_norm.weight
F32
F32
[256]
blk.27.attn_norm.weight
F32
F32
[5120]
blk.27.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.27.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.27.attn_q_norm.weight
F32
F32
[256]
blk.27.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.27.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.27.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.27.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.27.post_attention_norm.weight
F32
F32
[5120]
blk.28
blk.28.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.28.attn_norm.weight
F32
F32
[5120]
blk.28.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.28.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.28.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.28.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.28.post_attention_norm.weight
F32
F32
[5120]
blk.28.ssm_a
F32
F32
[48]
blk.28.ssm_alpha.weight
F32
F32
[5120, 48]
blk.28.ssm_beta.weight
F32
F32
[5120, 48]
blk.28.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.28.ssm_dt.bias
F32
F32
[48]
blk.28.ssm_norm.weight
F32
F32
[128]
blk.28.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.29
blk.29.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.29.attn_norm.weight
F32
F32
[5120]
blk.29.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.29.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.29.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.29.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.29.post_attention_norm.weight
F32
F32
[5120]
blk.29.ssm_a
F32
F32
[48]
blk.29.ssm_alpha.weight
F32
F32
[5120, 48]
blk.29.ssm_beta.weight
F32
F32
[5120, 48]
blk.29.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.29.ssm_dt.bias
F32
F32
[48]
blk.29.ssm_norm.weight
F32
F32
[128]
blk.29.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.30
blk.30.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.30.attn_norm.weight
F32
F32
[5120]
blk.30.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.30.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.30.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.30.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.30.post_attention_norm.weight
F32
F32
[5120]
blk.30.ssm_a
F32
F32
[48]
blk.30.ssm_alpha.weight
F32
F32
[5120, 48]
blk.30.ssm_beta.weight
F32
F32
[5120, 48]
blk.30.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.30.ssm_dt.bias
F32
F32
[48]
blk.30.ssm_norm.weight
F32
F32
[128]
blk.30.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.31
blk.31.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.31.attn_k_norm.weight
F32
F32
[256]
blk.31.attn_norm.weight
F32
F32
[5120]
blk.31.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.31.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.31.attn_q_norm.weight
F32
F32
[256]
blk.31.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.31.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.31.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.31.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.31.post_attention_norm.weight
F32
F32
[5120]
blk.32
blk.32.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.32.attn_norm.weight
F32
F32
[5120]
blk.32.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.32.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.32.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.32.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.32.post_attention_norm.weight
F32
F32
[5120]
blk.32.ssm_a
F32
F32
[48]
blk.32.ssm_alpha.weight
F32
F32
[5120, 48]
blk.32.ssm_beta.weight
F32
F32
[5120, 48]
blk.32.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.32.ssm_dt.bias
F32
F32
[48]
blk.32.ssm_norm.weight
F32
F32
[128]
blk.32.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.33
blk.33.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.33.attn_norm.weight
F32
F32
[5120]
blk.33.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.33.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.33.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.33.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.33.post_attention_norm.weight
F32
F32
[5120]
blk.33.ssm_a
F32
F32
[48]
blk.33.ssm_alpha.weight
F32
F32
[5120, 48]
blk.33.ssm_beta.weight
F32
F32
[5120, 48]
blk.33.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.33.ssm_dt.bias
F32
F32
[48]
blk.33.ssm_norm.weight
F32
F32
[128]
blk.33.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.34
blk.34.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.34.attn_norm.weight
F32
F32
[5120]
blk.34.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.34.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.34.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.34.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.34.post_attention_norm.weight
F32
F32
[5120]
blk.34.ssm_a
F32
F32
[48]
blk.34.ssm_alpha.weight
F32
F32
[5120, 48]
blk.34.ssm_beta.weight
F32
F32
[5120, 48]
blk.34.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.34.ssm_dt.bias
F32
F32
[48]
blk.34.ssm_norm.weight
F32
F32
[128]
blk.34.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.35
blk.35.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.35.attn_k_norm.weight
F32
F32
[256]
blk.35.attn_norm.weight
F32
F32
[5120]
blk.35.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.35.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.35.attn_q_norm.weight
F32
F32
[256]
blk.35.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.35.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.35.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.35.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.35.post_attention_norm.weight
F32
F32
[5120]
blk.36
blk.36.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.36.attn_norm.weight
F32
F32
[5120]
blk.36.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.36.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.36.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.36.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.36.post_attention_norm.weight
F32
F32
[5120]
blk.36.ssm_a
F32
F32
[48]
blk.36.ssm_alpha.weight
F32
F32
[5120, 48]
blk.36.ssm_beta.weight
F32
F32
[5120, 48]
blk.36.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.36.ssm_dt.bias
F32
F32
[48]
blk.36.ssm_norm.weight
F32
F32
[128]
blk.36.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.37
blk.37.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.37.attn_norm.weight
F32
F32
[5120]
blk.37.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.37.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.37.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.37.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.37.post_attention_norm.weight
F32
F32
[5120]
blk.37.ssm_a
F32
F32
[48]
blk.37.ssm_alpha.weight
F32
F32
[5120, 48]
blk.37.ssm_beta.weight
F32
F32
[5120, 48]
blk.37.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.37.ssm_dt.bias
F32
F32
[48]
blk.37.ssm_norm.weight
F32
F32
[128]
blk.37.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.38
blk.38.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.38.attn_norm.weight
F32
F32
[5120]
blk.38.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.38.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.38.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.38.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.38.post_attention_norm.weight
F32
F32
[5120]
blk.38.ssm_a
F32
F32
[48]
blk.38.ssm_alpha.weight
F32
F32
[5120, 48]
blk.38.ssm_beta.weight
F32
F32
[5120, 48]
blk.38.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.38.ssm_dt.bias
F32
F32
[48]
blk.38.ssm_norm.weight
F32
F32
[128]
blk.38.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.39
blk.39.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.39.attn_k_norm.weight
F32
F32
[256]
blk.39.attn_norm.weight
F32
F32
[5120]
blk.39.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.39.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.39.attn_q_norm.weight
F32
F32
[256]
blk.39.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.39.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.39.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.39.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.39.post_attention_norm.weight
F32
F32
[5120]
blk.40
blk.40.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.40.attn_norm.weight
F32
F32
[5120]
blk.40.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.40.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.40.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.40.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.40.post_attention_norm.weight
F32
F32
[5120]
blk.40.ssm_a
F32
F32
[48]
blk.40.ssm_alpha.weight
F32
F32
[5120, 48]
blk.40.ssm_beta.weight
F32
F32
[5120, 48]
blk.40.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.40.ssm_dt.bias
F32
F32
[48]
blk.40.ssm_norm.weight
F32
F32
[128]
blk.40.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.41
blk.41.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.41.attn_norm.weight
F32
F32
[5120]
blk.41.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.41.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.41.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.41.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.41.post_attention_norm.weight
F32
F32
[5120]
blk.41.ssm_a
F32
F32
[48]
blk.41.ssm_alpha.weight
F32
F32
[5120, 48]
blk.41.ssm_beta.weight
F32
F32
[5120, 48]
blk.41.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.41.ssm_dt.bias
F32
F32
[48]
blk.41.ssm_norm.weight
F32
F32
[128]
blk.41.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.42
blk.42.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.42.attn_norm.weight
F32
F32
[5120]
blk.42.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.42.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.42.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.42.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.42.post_attention_norm.weight
F32
F32
[5120]
blk.42.ssm_a
F32
F32
[48]
blk.42.ssm_alpha.weight
F32
F32
[5120, 48]
blk.42.ssm_beta.weight
F32
F32
[5120, 48]
blk.42.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.42.ssm_dt.bias
F32
F32
[48]
blk.42.ssm_norm.weight
F32
F32
[128]
blk.42.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.43
blk.43.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.43.attn_k_norm.weight
F32
F32
[256]
blk.43.attn_norm.weight
F32
F32
[5120]
blk.43.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.43.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.43.attn_q_norm.weight
F32
F32
[256]
blk.43.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.43.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.43.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.43.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.43.post_attention_norm.weight
F32
F32
[5120]
blk.44
blk.44.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.44.attn_norm.weight
F32
F32
[5120]
blk.44.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.44.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.44.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.44.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.44.post_attention_norm.weight
F32
F32
[5120]
blk.44.ssm_a
F32
F32
[48]
blk.44.ssm_alpha.weight
F32
F32
[5120, 48]
blk.44.ssm_beta.weight
F32
F32
[5120, 48]
blk.44.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.44.ssm_dt.bias
F32
F32
[48]
blk.44.ssm_norm.weight
F32
F32
[128]
blk.44.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.45
blk.45.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.45.attn_norm.weight
F32
F32
[5120]
blk.45.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.45.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.45.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.45.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.45.post_attention_norm.weight
F32
F32
[5120]
blk.45.ssm_a
F32
F32
[48]
blk.45.ssm_alpha.weight
F32
F32
[5120, 48]
blk.45.ssm_beta.weight
F32
F32
[5120, 48]
blk.45.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.45.ssm_dt.bias
F32
F32
[48]
blk.45.ssm_norm.weight
F32
F32
[128]
blk.45.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.46
blk.46.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.46.attn_norm.weight
F32
F32
[5120]
blk.46.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.46.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.46.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.46.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.46.post_attention_norm.weight
F32
F32
[5120]
blk.46.ssm_a
F32
F32
[48]
blk.46.ssm_alpha.weight
F32
F32
[5120, 48]
blk.46.ssm_beta.weight
F32
F32
[5120, 48]
blk.46.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.46.ssm_dt.bias
F32
F32
[48]
blk.46.ssm_norm.weight
F32
F32
[128]
blk.46.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.47
blk.47.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.47.attn_k_norm.weight
F32
F32
[256]
blk.47.attn_norm.weight
F32
F32
[5120]
blk.47.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.47.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.47.attn_q_norm.weight
F32
F32
[256]
blk.47.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.47.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.47.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.47.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.47.post_attention_norm.weight
F32
F32
[5120]
blk.48
blk.48.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.48.attn_norm.weight
F32
F32
[5120]
blk.48.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.48.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.48.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.48.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.48.post_attention_norm.weight
F32
F32
[5120]
blk.48.ssm_a
F32
F32
[48]
blk.48.ssm_alpha.weight
F32
F32
[5120, 48]
blk.48.ssm_beta.weight
F32
F32
[5120, 48]
blk.48.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.48.ssm_dt.bias
F32
F32
[48]
blk.48.ssm_norm.weight
F32
F32
[128]
blk.48.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.49
blk.49.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.49.attn_norm.weight
F32
F32
[5120]
blk.49.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.49.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.49.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.49.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.49.post_attention_norm.weight
F32
F32
[5120]
blk.49.ssm_a
F32
F32
[48]
blk.49.ssm_alpha.weight
F32
F32
[5120, 48]
blk.49.ssm_beta.weight
F32
F32
[5120, 48]
blk.49.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.49.ssm_dt.bias
F32
F32
[48]
blk.49.ssm_norm.weight
F32
F32
[128]
blk.49.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.50
blk.50.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.50.attn_norm.weight
F32
F32
[5120]
blk.50.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.50.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.50.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.50.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.50.post_attention_norm.weight
F32
F32
[5120]
blk.50.ssm_a
F32
F32
[48]
blk.50.ssm_alpha.weight
F32
F32
[5120, 48]
blk.50.ssm_beta.weight
F32
F32
[5120, 48]
blk.50.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.50.ssm_dt.bias
F32
F32
[48]
blk.50.ssm_norm.weight
F32
F32
[128]
blk.50.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.51
blk.51.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.51.attn_k_norm.weight
F32
F32
[256]
blk.51.attn_norm.weight
F32
F32
[5120]
blk.51.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.51.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.51.attn_q_norm.weight
F32
F32
[256]
blk.51.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.51.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.51.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.51.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.51.post_attention_norm.weight
F32
F32
[5120]
blk.52
blk.52.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.52.attn_norm.weight
F32
F32
[5120]
blk.52.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.52.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.52.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.52.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.52.post_attention_norm.weight
F32
F32
[5120]
blk.52.ssm_a
F32
F32
[48]
blk.52.ssm_alpha.weight
F32
F32
[5120, 48]
blk.52.ssm_beta.weight
F32
F32
[5120, 48]
blk.52.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.52.ssm_dt.bias
F32
F32
[48]
blk.52.ssm_norm.weight
F32
F32
[128]
blk.52.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.53
blk.53.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.53.attn_norm.weight
F32
F32
[5120]
blk.53.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.53.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.53.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.53.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.53.post_attention_norm.weight
F32
F32
[5120]
blk.53.ssm_a
F32
F32
[48]
blk.53.ssm_alpha.weight
F32
F32
[5120, 48]
blk.53.ssm_beta.weight
F32
F32
[5120, 48]
blk.53.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.53.ssm_dt.bias
F32
F32
[48]
blk.53.ssm_norm.weight
F32
F32
[128]
blk.53.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.54
blk.54.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.54.attn_norm.weight
F32
F32
[5120]
blk.54.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.54.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.54.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.54.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.54.post_attention_norm.weight
F32
F32
[5120]
blk.54.ssm_a
F32
F32
[48]
blk.54.ssm_alpha.weight
F32
F32
[5120, 48]
blk.54.ssm_beta.weight
F32
F32
[5120, 48]
blk.54.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.54.ssm_dt.bias
F32
F32
[48]
blk.54.ssm_norm.weight
F32
F32
[128]
blk.54.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.55
blk.55.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.55.attn_k_norm.weight
F32
F32
[256]
blk.55.attn_norm.weight
F32
F32
[5120]
blk.55.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.55.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.55.attn_q_norm.weight
F32
F32
[256]
blk.55.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.55.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.55.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.55.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.55.post_attention_norm.weight
F32
F32
[5120]
blk.56
blk.56.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.56.attn_norm.weight
F32
F32
[5120]
blk.56.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.56.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.56.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.56.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.56.post_attention_norm.weight
F32
F32
[5120]
blk.56.ssm_a
F32
F32
[48]
blk.56.ssm_alpha.weight
F32
F32
[5120, 48]
blk.56.ssm_beta.weight
F32
F32
[5120, 48]
blk.56.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.56.ssm_dt.bias
F32
F32
[48]
blk.56.ssm_norm.weight
F32
F32
[128]
blk.56.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.57
blk.57.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.57.attn_norm.weight
F32
F32
[5120]
blk.57.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.57.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.57.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.57.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.57.post_attention_norm.weight
F32
F32
[5120]
blk.57.ssm_a
F32
F32
[48]
blk.57.ssm_alpha.weight
F32
F32
[5120, 48]
blk.57.ssm_beta.weight
F32
F32
[5120, 48]
blk.57.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.57.ssm_dt.bias
F32
F32
[48]
blk.57.ssm_norm.weight
F32
F32
[128]
blk.57.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.58
blk.58.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.58.attn_norm.weight
F32
F32
[5120]
blk.58.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.58.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.58.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.58.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.58.post_attention_norm.weight
F32
F32
[5120]
blk.58.ssm_a
F32
F32
[48]
blk.58.ssm_alpha.weight
F32
F32
[5120, 48]
blk.58.ssm_beta.weight
F32
F32
[5120, 48]
blk.58.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.58.ssm_dt.bias
F32
F32
[48]
blk.58.ssm_norm.weight
F32
F32
[128]
blk.58.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.59
blk.59.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.59.attn_k_norm.weight
F32
F32
[256]
blk.59.attn_norm.weight
F32
F32
[5120]
blk.59.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.59.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.59.attn_q_norm.weight
F32
F32
[256]
blk.59.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.59.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.59.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.59.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.59.post_attention_norm.weight
F32
F32
[5120]
blk.60
blk.60.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.60.attn_norm.weight
F32
F32
[5120]
blk.60.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.60.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.60.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.60.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.60.post_attention_norm.weight
F32
F32
[5120]
blk.60.ssm_a
F32
F32
[48]
blk.60.ssm_alpha.weight
F32
F32
[5120, 48]
blk.60.ssm_beta.weight
F32
F32
[5120, 48]
blk.60.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.60.ssm_dt.bias
F32
F32
[48]
blk.60.ssm_norm.weight
F32
F32
[128]
blk.60.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.61
blk.61.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.61.attn_norm.weight
F32
F32
[5120]
blk.61.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.61.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.61.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.61.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.61.post_attention_norm.weight
F32
F32
[5120]
blk.61.ssm_a
F32
F32
[48]
blk.61.ssm_alpha.weight
F32
F32
[5120, 48]
blk.61.ssm_beta.weight
F32
F32
[5120, 48]
blk.61.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.61.ssm_dt.bias
F32
F32
[48]
blk.61.ssm_norm.weight
F32
F32
[128]
blk.61.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.62
blk.62.attn_gate.weight
Q3_K
Q3_K
[5120, 6144]
blk.62.attn_norm.weight
F32
F32
[5120]
blk.62.attn_qkv.weight
Q4_K
Q4_K
[5120, 10240]
blk.62.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.62.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.62.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.62.post_attention_norm.weight
F32
F32
[5120]
blk.62.ssm_a
F32
F32
[48]
blk.62.ssm_alpha.weight
F32
F32
[5120, 48]
blk.62.ssm_beta.weight
F32
F32
[5120, 48]
blk.62.ssm_conv1d.weight
F32
F32
[4, 10240]
blk.62.ssm_dt.bias
F32
F32
[48]
blk.62.ssm_norm.weight
F32
F32
[128]
blk.62.ssm_out.weight
Q4_K
Q4_K
[6144, 5120]
blk.63
blk.63.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.63.attn_k_norm.weight
F32
F32
[256]
blk.63.attn_norm.weight
F32
F32
[5120]
blk.63.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.63.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.63.attn_q_norm.weight
F32
F32
[256]
blk.63.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.63.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.63.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.63.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.63.post_attention_norm.weight
F32
F32
[5120]
blk.64
blk.64.attn_k.weight
Q3_K
Q3_K
[5120, 1024]
blk.64.attn_k_norm.weight
F32
F32
[256]
blk.64.attn_norm.weight
F32
F32
[5120]
blk.64.attn_output.weight
Q4_K
Q4_K
[6144, 5120]
blk.64.attn_q.weight
Q3_K
Q3_K
[5120, 12288]
blk.64.attn_q_norm.weight
F32
F32
[256]
blk.64.attn_v.weight
Q4_K
Q4_K
[5120, 1024]
blk.64.ffn_down.weight
Q4_K
Q4_K
[17408, 5120]
blk.64.ffn_gate.weight
Q3_K
Q3_K
[5120, 17408]
blk.64.ffn_up.weight
Q3_K
Q3_K
[5120, 17408]
blk.64.nextn.eh_proj.weight
Q8_0
Q8_0
[10240, 5120]
blk.64.nextn.enorm.weight
F32
F32
[5120]
blk.64.nextn.hnorm.weight
F32
F32
[5120]
blk.64.nextn.shared_head_norm.weight
F32
F32
[5120]
blk.64.post_attention_norm.weight
F32
F32
[5120]
output.weight
Q6_K
Q6_K
[5120, 248320]
output_norm.weight
F32
F32
[5120]