RWKV-6 is the sixth generation of RWKV models. RWKV (pronounced "RwaKuv") is an RNN with great LLM performance.
1.6b
3b
7b
14b
1,388 Pulls Updated 2 months ago
ad296e798c9b · 8.8GB
-
general.architecture: rwkv6
-
general.file_type: Q4_K_M
-
rwkv6.attention.head_count: 0
-
rwkv6.attention.layer_norm_epsilon: 1e-05
-
rwkv6.block_count: 61
-
rwkv6.context_length: 1048576
-
rwkv6.embedding_length: 4096
-
rwkv6.feed_forward_length: 14336
-
rwkv6.rescale_every_n_layers: 6
-
rwkv6.time_decay_extra_dim: 128
-
rwkv6.time_mix_extra_dim: 64
-
rwkv6.wkv.head_size: 64
-
tokenizer.ggml.bos_token_id: 0
-
tokenizer.ggml.eos_token_id: 0
-
tokenizer.ggml.eot_token_id: 261
-
tokenizer.ggml.model: rwkv
-
tokenizer.ggml.token_type: [3, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens: [<s>, \x00, \x01, \x02, \x03, ...]
-
token_embd.weightQ4_K[4096, 65536]
-
blk.0.attn_norm.biasF32[4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_norm_2.biasF32[4096]
-
blk.0.attn_norm_2.weightF32[4096]
-
blk.0.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.0.channel_mix_lerp_k.weightF32[4096]
-
blk.0.channel_mix_lerp_r.weightF32[4096]
-
blk.0.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.0.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.0.time_mix_decay.weightF32[4096]
-
blk.0.time_mix_decay_w1.weightF32[4096, 128]
-
blk.0.time_mix_decay_w2.weightF32[128, 4096]
-
blk.0.time_mix_first.weightF32[64, 64]
-
blk.0.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.0.time_mix_key.weightQ4_K[4096, 4096]
-
blk.0.time_mix_lerp_g.weightF32[4096]
-
blk.0.time_mix_lerp_k.weightF32[4096]
-
blk.0.time_mix_lerp_r.weightF32[4096]
-
blk.0.time_mix_lerp_v.weightF32[4096]
-
blk.0.time_mix_lerp_w.weightF32[4096]
-
blk.0.time_mix_lerp_x.weightF32[4096]
-
blk.0.time_mix_ln.biasF32[4096]
-
blk.0.time_mix_ln.weightF32[4096]
-
blk.0.time_mix_output.weightQ4_K[4096, 4096]
-
blk.0.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.0.time_mix_value.weightQ4_K[4096, 4096]
-
blk.0.time_mix_w1.weightF32[4096, 320]
-
blk.0.time_mix_w2.weightF32[64, 4096, 5]
-
blk.1.attn_norm.biasF32[4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_norm_2.biasF32[4096]
-
blk.1.attn_norm_2.weightF32[4096]
-
blk.1.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.1.channel_mix_lerp_k.weightF32[4096]
-
blk.1.channel_mix_lerp_r.weightF32[4096]
-
blk.1.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.1.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.1.time_mix_decay.weightF32[4096]
-
blk.1.time_mix_decay_w1.weightF32[4096, 128]
-
blk.1.time_mix_decay_w2.weightF32[128, 4096]
-
blk.1.time_mix_first.weightF32[64, 64]
-
blk.1.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.1.time_mix_key.weightQ4_K[4096, 4096]
-
blk.1.time_mix_lerp_g.weightF32[4096]
-
blk.1.time_mix_lerp_k.weightF32[4096]
-
blk.1.time_mix_lerp_r.weightF32[4096]
-
blk.1.time_mix_lerp_v.weightF32[4096]
-
blk.1.time_mix_lerp_w.weightF32[4096]
-
blk.1.time_mix_lerp_x.weightF32[4096]
-
blk.1.time_mix_ln.biasF32[4096]
-
blk.1.time_mix_ln.weightF32[4096]
-
blk.1.time_mix_output.weightQ4_K[4096, 4096]
-
blk.1.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.1.time_mix_value.weightQ4_K[4096, 4096]
-
blk.1.time_mix_w1.weightF32[4096, 320]
-
blk.1.time_mix_w2.weightF32[64, 4096, 5]
-
blk.2.attn_norm.biasF32[4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_norm_2.biasF32[4096]
-
blk.2.attn_norm_2.weightF32[4096]
-
blk.2.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.2.channel_mix_lerp_k.weightF32[4096]
-
blk.2.channel_mix_lerp_r.weightF32[4096]
-
blk.2.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.2.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.2.time_mix_decay.weightF32[4096]
-
blk.2.time_mix_decay_w1.weightF32[4096, 128]
-
blk.2.time_mix_decay_w2.weightF32[128, 4096]
-
blk.2.time_mix_first.weightF32[64, 64]
-
blk.2.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.2.time_mix_key.weightQ4_K[4096, 4096]
-
blk.2.time_mix_lerp_g.weightF32[4096]
-
blk.2.time_mix_lerp_k.weightF32[4096]
-
blk.2.time_mix_lerp_r.weightF32[4096]
-
blk.2.time_mix_lerp_v.weightF32[4096]
-
blk.2.time_mix_lerp_w.weightF32[4096]
-
blk.2.time_mix_lerp_x.weightF32[4096]
-
blk.2.time_mix_ln.biasF32[4096]
-
blk.2.time_mix_ln.weightF32[4096]
-
blk.2.time_mix_output.weightQ4_K[4096, 4096]
-
blk.2.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.2.time_mix_value.weightQ4_K[4096, 4096]
-
blk.2.time_mix_w1.weightF32[4096, 320]
-
blk.2.time_mix_w2.weightF32[64, 4096, 5]
-
blk.3.attn_norm.biasF32[4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_norm_2.biasF32[4096]
-
blk.3.attn_norm_2.weightF32[4096]
-
blk.3.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.3.channel_mix_lerp_k.weightF32[4096]
-
blk.3.channel_mix_lerp_r.weightF32[4096]
-
blk.3.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.3.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.3.time_mix_decay.weightF32[4096]
-
blk.3.time_mix_decay_w1.weightF32[4096, 128]
-
blk.3.time_mix_decay_w2.weightF32[128, 4096]
-
blk.3.time_mix_first.weightF32[64, 64]
-
blk.3.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.3.time_mix_key.weightQ4_K[4096, 4096]
-
blk.3.time_mix_lerp_g.weightF32[4096]
-
blk.3.time_mix_lerp_k.weightF32[4096]
-
blk.3.time_mix_lerp_r.weightF32[4096]
-
blk.3.time_mix_lerp_v.weightF32[4096]
-
blk.3.time_mix_lerp_w.weightF32[4096]
-
blk.3.time_mix_lerp_x.weightF32[4096]
-
blk.3.time_mix_ln.biasF32[4096]
-
blk.3.time_mix_ln.weightF32[4096]
-
blk.3.time_mix_output.weightQ4_K[4096, 4096]
-
blk.3.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.3.time_mix_value.weightQ4_K[4096, 4096]
-
blk.3.time_mix_w1.weightF32[4096, 320]
-
blk.3.time_mix_w2.weightF32[64, 4096, 5]
-
blk.4.attn_norm.biasF32[4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_norm_2.biasF32[4096]
-
blk.4.attn_norm_2.weightF32[4096]
-
blk.4.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.4.channel_mix_lerp_k.weightF32[4096]
-
blk.4.channel_mix_lerp_r.weightF32[4096]
-
blk.4.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.4.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.4.time_mix_decay.weightF32[4096]
-
blk.4.time_mix_decay_w1.weightF32[4096, 128]
-
blk.4.time_mix_decay_w2.weightF32[128, 4096]
-
blk.4.time_mix_first.weightF32[64, 64]
-
blk.4.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.4.time_mix_key.weightQ4_K[4096, 4096]
-
blk.4.time_mix_lerp_g.weightF32[4096]
-
blk.4.time_mix_lerp_k.weightF32[4096]
-
blk.4.time_mix_lerp_r.weightF32[4096]
-
blk.4.time_mix_lerp_v.weightF32[4096]
-
blk.4.time_mix_lerp_w.weightF32[4096]
-
blk.4.time_mix_lerp_x.weightF32[4096]
-
blk.4.time_mix_ln.biasF32[4096]
-
blk.4.time_mix_ln.weightF32[4096]
-
blk.4.time_mix_output.weightQ4_K[4096, 4096]
-
blk.4.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.4.time_mix_value.weightQ4_K[4096, 4096]
-
blk.4.time_mix_w1.weightF32[4096, 320]
-
blk.4.time_mix_w2.weightF32[64, 4096, 5]
-
blk.5.attn_norm.biasF32[4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_norm_2.biasF32[4096]
-
blk.5.attn_norm_2.weightF32[4096]
-
blk.5.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.5.channel_mix_lerp_k.weightF32[4096]
-
blk.5.channel_mix_lerp_r.weightF32[4096]
-
blk.5.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.5.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.5.time_mix_decay.weightF32[4096]
-
blk.5.time_mix_decay_w1.weightF32[4096, 128]
-
blk.5.time_mix_decay_w2.weightF32[128, 4096]
-
blk.5.time_mix_first.weightF32[64, 64]
-
blk.5.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.5.time_mix_key.weightQ4_K[4096, 4096]
-
blk.5.time_mix_lerp_g.weightF32[4096]
-
blk.5.time_mix_lerp_k.weightF32[4096]
-
blk.5.time_mix_lerp_r.weightF32[4096]
-
blk.5.time_mix_lerp_v.weightF32[4096]
-
blk.5.time_mix_lerp_w.weightF32[4096]
-
blk.5.time_mix_lerp_x.weightF32[4096]
-
blk.5.time_mix_ln.biasF32[4096]
-
blk.5.time_mix_ln.weightF32[4096]
-
blk.5.time_mix_output.weightQ4_K[4096, 4096]
-
blk.5.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.5.time_mix_value.weightQ4_K[4096, 4096]
-
blk.5.time_mix_w1.weightF32[4096, 320]
-
blk.5.time_mix_w2.weightF32[64, 4096, 5]
-
blk.6.attn_norm.biasF32[4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_norm_2.biasF32[4096]
-
blk.6.attn_norm_2.weightF32[4096]
-
blk.6.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.6.channel_mix_lerp_k.weightF32[4096]
-
blk.6.channel_mix_lerp_r.weightF32[4096]
-
blk.6.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.6.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.6.time_mix_decay.weightF32[4096]
-
blk.6.time_mix_decay_w1.weightF32[4096, 128]
-
blk.6.time_mix_decay_w2.weightF32[128, 4096]
-
blk.6.time_mix_first.weightF32[64, 64]
-
blk.6.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.6.time_mix_key.weightQ4_K[4096, 4096]
-
blk.6.time_mix_lerp_g.weightF32[4096]
-
blk.6.time_mix_lerp_k.weightF32[4096]
-
blk.6.time_mix_lerp_r.weightF32[4096]
-
blk.6.time_mix_lerp_v.weightF32[4096]
-
blk.6.time_mix_lerp_w.weightF32[4096]
-
blk.6.time_mix_lerp_x.weightF32[4096]
-
blk.6.time_mix_ln.biasF32[4096]
-
blk.6.time_mix_ln.weightF32[4096]
-
blk.6.time_mix_output.weightQ4_K[4096, 4096]
-
blk.6.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.6.time_mix_value.weightQ4_K[4096, 4096]
-
blk.6.time_mix_w1.weightF32[4096, 320]
-
blk.6.time_mix_w2.weightF32[64, 4096, 5]
-
blk.7.attn_norm.biasF32[4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_norm_2.biasF32[4096]
-
blk.7.attn_norm_2.weightF32[4096]
-
blk.7.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.7.channel_mix_lerp_k.weightF32[4096]
-
blk.7.channel_mix_lerp_r.weightF32[4096]
-
blk.7.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.7.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.7.time_mix_decay.weightF32[4096]
-
blk.7.time_mix_decay_w1.weightF32[4096, 128]
-
blk.7.time_mix_decay_w2.weightF32[128, 4096]
-
blk.7.time_mix_first.weightF32[64, 64]
-
blk.7.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.7.time_mix_key.weightQ4_K[4096, 4096]
-
blk.7.time_mix_lerp_g.weightF32[4096]
-
blk.7.time_mix_lerp_k.weightF32[4096]
-
blk.7.time_mix_lerp_r.weightF32[4096]
-
blk.7.time_mix_lerp_v.weightF32[4096]
-
blk.7.time_mix_lerp_w.weightF32[4096]
-
blk.7.time_mix_lerp_x.weightF32[4096]
-
blk.7.time_mix_ln.biasF32[4096]
-
blk.7.time_mix_ln.weightF32[4096]
-
blk.7.time_mix_output.weightQ4_K[4096, 4096]
-
blk.7.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.7.time_mix_value.weightQ4_K[4096, 4096]
-
blk.7.time_mix_w1.weightF32[4096, 320]
-
blk.7.time_mix_w2.weightF32[64, 4096, 5]
-
blk.8.attn_norm.biasF32[4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_norm_2.biasF32[4096]
-
blk.8.attn_norm_2.weightF32[4096]
-
blk.8.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.8.channel_mix_lerp_k.weightF32[4096]
-
blk.8.channel_mix_lerp_r.weightF32[4096]
-
blk.8.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.8.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.8.time_mix_decay.weightF32[4096]
-
blk.8.time_mix_decay_w1.weightF32[4096, 128]
-
blk.8.time_mix_decay_w2.weightF32[128, 4096]
-
blk.8.time_mix_first.weightF32[64, 64]
-
blk.8.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.8.time_mix_key.weightQ4_K[4096, 4096]
-
blk.8.time_mix_lerp_g.weightF32[4096]
-
blk.8.time_mix_lerp_k.weightF32[4096]
-
blk.8.time_mix_lerp_r.weightF32[4096]
-
blk.8.time_mix_lerp_v.weightF32[4096]
-
blk.8.time_mix_lerp_w.weightF32[4096]
-
blk.8.time_mix_lerp_x.weightF32[4096]
-
blk.8.time_mix_ln.biasF32[4096]
-
blk.8.time_mix_ln.weightF32[4096]
-
blk.8.time_mix_output.weightQ4_K[4096, 4096]
-
blk.8.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.8.time_mix_value.weightQ4_K[4096, 4096]
-
blk.8.time_mix_w1.weightF32[4096, 320]
-
blk.8.time_mix_w2.weightF32[64, 4096, 5]
-
blk.9.attn_norm.biasF32[4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_norm_2.biasF32[4096]
-
blk.9.attn_norm_2.weightF32[4096]
-
blk.9.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.9.channel_mix_lerp_k.weightF32[4096]
-
blk.9.channel_mix_lerp_r.weightF32[4096]
-
blk.9.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.9.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.9.time_mix_decay.weightF32[4096]
-
blk.9.time_mix_decay_w1.weightF32[4096, 128]
-
blk.9.time_mix_decay_w2.weightF32[128, 4096]
-
blk.9.time_mix_first.weightF32[64, 64]
-
blk.9.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.9.time_mix_key.weightQ4_K[4096, 4096]
-
blk.9.time_mix_lerp_g.weightF32[4096]
-
blk.9.time_mix_lerp_k.weightF32[4096]
-
blk.9.time_mix_lerp_r.weightF32[4096]
-
blk.9.time_mix_lerp_v.weightF32[4096]
-
blk.9.time_mix_lerp_w.weightF32[4096]
-
blk.9.time_mix_lerp_x.weightF32[4096]
-
blk.9.time_mix_ln.biasF32[4096]
-
blk.9.time_mix_ln.weightF32[4096]
-
blk.9.time_mix_output.weightQ4_K[4096, 4096]
-
blk.9.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.9.time_mix_value.weightQ4_K[4096, 4096]
-
blk.9.time_mix_w1.weightF32[4096, 320]
-
blk.9.time_mix_w2.weightF32[64, 4096, 5]
-
blk.10.attn_norm.biasF32[4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_norm_2.biasF32[4096]
-
blk.10.attn_norm_2.weightF32[4096]
-
blk.10.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.10.channel_mix_lerp_k.weightF32[4096]
-
blk.10.channel_mix_lerp_r.weightF32[4096]
-
blk.10.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.10.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.10.time_mix_decay.weightF32[4096]
-
blk.10.time_mix_decay_w1.weightF32[4096, 128]
-
blk.10.time_mix_decay_w2.weightF32[128, 4096]
-
blk.10.time_mix_first.weightF32[64, 64]
-
blk.10.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.10.time_mix_key.weightQ4_K[4096, 4096]
-
blk.10.time_mix_lerp_g.weightF32[4096]
-
blk.10.time_mix_lerp_k.weightF32[4096]
-
blk.10.time_mix_lerp_r.weightF32[4096]
-
blk.10.time_mix_lerp_v.weightF32[4096]
-
blk.10.time_mix_lerp_w.weightF32[4096]
-
blk.10.time_mix_lerp_x.weightF32[4096]
-
blk.10.time_mix_ln.biasF32[4096]
-
blk.10.time_mix_ln.weightF32[4096]
-
blk.10.time_mix_output.weightQ4_K[4096, 4096]
-
blk.10.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.10.time_mix_value.weightQ4_K[4096, 4096]
-
blk.10.time_mix_w1.weightF32[4096, 320]
-
blk.10.time_mix_w2.weightF32[64, 4096, 5]
-
blk.11.attn_norm.biasF32[4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_norm_2.biasF32[4096]
-
blk.11.attn_norm_2.weightF32[4096]
-
blk.11.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.11.channel_mix_lerp_k.weightF32[4096]
-
blk.11.channel_mix_lerp_r.weightF32[4096]
-
blk.11.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.11.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.11.time_mix_decay.weightF32[4096]
-
blk.11.time_mix_decay_w1.weightF32[4096, 128]
-
blk.11.time_mix_decay_w2.weightF32[128, 4096]
-
blk.11.time_mix_first.weightF32[64, 64]
-
blk.11.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.11.time_mix_key.weightQ4_K[4096, 4096]
-
blk.11.time_mix_lerp_g.weightF32[4096]
-
blk.11.time_mix_lerp_k.weightF32[4096]
-
blk.11.time_mix_lerp_r.weightF32[4096]
-
blk.11.time_mix_lerp_v.weightF32[4096]
-
blk.11.time_mix_lerp_w.weightF32[4096]
-
blk.11.time_mix_lerp_x.weightF32[4096]
-
blk.11.time_mix_ln.biasF32[4096]
-
blk.11.time_mix_ln.weightF32[4096]
-
blk.11.time_mix_output.weightQ4_K[4096, 4096]
-
blk.11.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.11.time_mix_value.weightQ4_K[4096, 4096]
-
blk.11.time_mix_w1.weightF32[4096, 320]
-
blk.11.time_mix_w2.weightF32[64, 4096, 5]
-
blk.12.attn_norm.biasF32[4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_norm_2.biasF32[4096]
-
blk.12.attn_norm_2.weightF32[4096]
-
blk.12.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.12.channel_mix_lerp_k.weightF32[4096]
-
blk.12.channel_mix_lerp_r.weightF32[4096]
-
blk.12.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.12.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.12.time_mix_decay.weightF32[4096]
-
blk.12.time_mix_decay_w1.weightF32[4096, 128]
-
blk.12.time_mix_decay_w2.weightF32[128, 4096]
-
blk.12.time_mix_first.weightF32[64, 64]
-
blk.12.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.12.time_mix_key.weightQ4_K[4096, 4096]
-
blk.12.time_mix_lerp_g.weightF32[4096]
-
blk.12.time_mix_lerp_k.weightF32[4096]
-
blk.12.time_mix_lerp_r.weightF32[4096]
-
blk.12.time_mix_lerp_v.weightF32[4096]
-
blk.12.time_mix_lerp_w.weightF32[4096]
-
blk.12.time_mix_lerp_x.weightF32[4096]
-
blk.12.time_mix_ln.biasF32[4096]
-
blk.12.time_mix_ln.weightF32[4096]
-
blk.12.time_mix_output.weightQ4_K[4096, 4096]
-
blk.12.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.12.time_mix_value.weightQ4_K[4096, 4096]
-
blk.12.time_mix_w1.weightF32[4096, 320]
-
blk.12.time_mix_w2.weightF32[64, 4096, 5]
-
blk.13.attn_norm.biasF32[4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_norm_2.biasF32[4096]
-
blk.13.attn_norm_2.weightF32[4096]
-
blk.13.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.13.channel_mix_lerp_k.weightF32[4096]
-
blk.13.channel_mix_lerp_r.weightF32[4096]
-
blk.13.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.13.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.13.time_mix_decay.weightF32[4096]
-
blk.13.time_mix_decay_w1.weightF32[4096, 128]
-
blk.13.time_mix_decay_w2.weightF32[128, 4096]
-
blk.13.time_mix_first.weightF32[64, 64]
-
blk.13.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.13.time_mix_key.weightQ4_K[4096, 4096]
-
blk.13.time_mix_lerp_g.weightF32[4096]
-
blk.13.time_mix_lerp_k.weightF32[4096]
-
blk.13.time_mix_lerp_r.weightF32[4096]
-
blk.13.time_mix_lerp_v.weightF32[4096]
-
blk.13.time_mix_lerp_w.weightF32[4096]
-
blk.13.time_mix_lerp_x.weightF32[4096]
-
blk.13.time_mix_ln.biasF32[4096]
-
blk.13.time_mix_ln.weightF32[4096]
-
blk.13.time_mix_output.weightQ4_K[4096, 4096]
-
blk.13.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.13.time_mix_value.weightQ4_K[4096, 4096]
-
blk.13.time_mix_w1.weightF32[4096, 320]
-
blk.13.time_mix_w2.weightF32[64, 4096, 5]
-
blk.14.attn_norm.biasF32[4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_norm_2.biasF32[4096]
-
blk.14.attn_norm_2.weightF32[4096]
-
blk.14.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.14.channel_mix_lerp_k.weightF32[4096]
-
blk.14.channel_mix_lerp_r.weightF32[4096]
-
blk.14.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.14.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.14.time_mix_decay.weightF32[4096]
-
blk.14.time_mix_decay_w1.weightF32[4096, 128]
-
blk.14.time_mix_decay_w2.weightF32[128, 4096]
-
blk.14.time_mix_first.weightF32[64, 64]
-
blk.14.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.14.time_mix_key.weightQ4_K[4096, 4096]
-
blk.14.time_mix_lerp_g.weightF32[4096]
-
blk.14.time_mix_lerp_k.weightF32[4096]
-
blk.14.time_mix_lerp_r.weightF32[4096]
-
blk.14.time_mix_lerp_v.weightF32[4096]
-
blk.14.time_mix_lerp_w.weightF32[4096]
-
blk.14.time_mix_lerp_x.weightF32[4096]
-
blk.14.time_mix_ln.biasF32[4096]
-
blk.14.time_mix_ln.weightF32[4096]
-
blk.14.time_mix_output.weightQ4_K[4096, 4096]
-
blk.14.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.14.time_mix_value.weightQ4_K[4096, 4096]
-
blk.14.time_mix_w1.weightF32[4096, 320]
-
blk.14.time_mix_w2.weightF32[64, 4096, 5]
-
blk.15.attn_norm.biasF32[4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_norm_2.biasF32[4096]
-
blk.15.attn_norm_2.weightF32[4096]
-
blk.15.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.15.channel_mix_lerp_k.weightF32[4096]
-
blk.15.channel_mix_lerp_r.weightF32[4096]
-
blk.15.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.15.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.15.time_mix_decay.weightF32[4096]
-
blk.15.time_mix_decay_w1.weightF32[4096, 128]
-
blk.15.time_mix_decay_w2.weightF32[128, 4096]
-
blk.15.time_mix_first.weightF32[64, 64]
-
blk.15.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.15.time_mix_key.weightQ4_K[4096, 4096]
-
blk.15.time_mix_lerp_g.weightF32[4096]
-
blk.15.time_mix_lerp_k.weightF32[4096]
-
blk.15.time_mix_lerp_r.weightF32[4096]
-
blk.15.time_mix_lerp_v.weightF32[4096]
-
blk.15.time_mix_lerp_w.weightF32[4096]
-
blk.15.time_mix_lerp_x.weightF32[4096]
-
blk.15.time_mix_ln.biasF32[4096]
-
blk.15.time_mix_ln.weightF32[4096]
-
blk.15.time_mix_output.weightQ4_K[4096, 4096]
-
blk.15.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.15.time_mix_value.weightQ4_K[4096, 4096]
-
blk.15.time_mix_w1.weightF32[4096, 320]
-
blk.15.time_mix_w2.weightF32[64, 4096, 5]
-
blk.16.attn_norm.biasF32[4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_norm_2.biasF32[4096]
-
blk.16.attn_norm_2.weightF32[4096]
-
blk.16.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.16.channel_mix_lerp_k.weightF32[4096]
-
blk.16.channel_mix_lerp_r.weightF32[4096]
-
blk.16.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.16.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.16.time_mix_decay.weightF32[4096]
-
blk.16.time_mix_decay_w1.weightF32[4096, 128]
-
blk.16.time_mix_decay_w2.weightF32[128, 4096]
-
blk.16.time_mix_first.weightF32[64, 64]
-
blk.16.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.16.time_mix_key.weightQ4_K[4096, 4096]
-
blk.16.time_mix_lerp_g.weightF32[4096]
-
blk.16.time_mix_lerp_k.weightF32[4096]
-
blk.16.time_mix_lerp_r.weightF32[4096]
-
blk.16.time_mix_lerp_v.weightF32[4096]
-
blk.16.time_mix_lerp_w.weightF32[4096]
-
blk.16.time_mix_lerp_x.weightF32[4096]
-
blk.16.time_mix_ln.biasF32[4096]
-
blk.16.time_mix_ln.weightF32[4096]
-
blk.16.time_mix_output.weightQ4_K[4096, 4096]
-
blk.16.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.16.time_mix_value.weightQ4_K[4096, 4096]
-
blk.16.time_mix_w1.weightF32[4096, 320]
-
blk.16.time_mix_w2.weightF32[64, 4096, 5]
-
blk.17.attn_norm.biasF32[4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_norm_2.biasF32[4096]
-
blk.17.attn_norm_2.weightF32[4096]
-
blk.17.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.17.channel_mix_lerp_k.weightF32[4096]
-
blk.17.channel_mix_lerp_r.weightF32[4096]
-
blk.17.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.17.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.17.time_mix_decay.weightF32[4096]
-
blk.17.time_mix_decay_w1.weightF32[4096, 128]
-
blk.17.time_mix_decay_w2.weightF32[128, 4096]
-
blk.17.time_mix_first.weightF32[64, 64]
-
blk.17.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.17.time_mix_key.weightQ4_K[4096, 4096]
-
blk.17.time_mix_lerp_g.weightF32[4096]
-
blk.17.time_mix_lerp_k.weightF32[4096]
-
blk.17.time_mix_lerp_r.weightF32[4096]
-
blk.17.time_mix_lerp_v.weightF32[4096]
-
blk.17.time_mix_lerp_w.weightF32[4096]
-
blk.17.time_mix_lerp_x.weightF32[4096]
-
blk.17.time_mix_ln.biasF32[4096]
-
blk.17.time_mix_ln.weightF32[4096]
-
blk.17.time_mix_output.weightQ4_K[4096, 4096]
-
blk.17.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.17.time_mix_value.weightQ4_K[4096, 4096]
-
blk.17.time_mix_w1.weightF32[4096, 320]
-
blk.17.time_mix_w2.weightF32[64, 4096, 5]
-
blk.18.attn_norm.biasF32[4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_norm_2.biasF32[4096]
-
blk.18.attn_norm_2.weightF32[4096]
-
blk.18.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.18.channel_mix_lerp_k.weightF32[4096]
-
blk.18.channel_mix_lerp_r.weightF32[4096]
-
blk.18.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.18.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.18.time_mix_decay.weightF32[4096]
-
blk.18.time_mix_decay_w1.weightF32[4096, 128]
-
blk.18.time_mix_decay_w2.weightF32[128, 4096]
-
blk.18.time_mix_first.weightF32[64, 64]
-
blk.18.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.18.time_mix_key.weightQ4_K[4096, 4096]
-
blk.18.time_mix_lerp_g.weightF32[4096]
-
blk.18.time_mix_lerp_k.weightF32[4096]
-
blk.18.time_mix_lerp_r.weightF32[4096]
-
blk.18.time_mix_lerp_v.weightF32[4096]
-
blk.18.time_mix_lerp_w.weightF32[4096]
-
blk.18.time_mix_lerp_x.weightF32[4096]
-
blk.18.time_mix_ln.biasF32[4096]
-
blk.18.time_mix_ln.weightF32[4096]
-
blk.18.time_mix_output.weightQ4_K[4096, 4096]
-
blk.18.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.18.time_mix_value.weightQ4_K[4096, 4096]
-
blk.18.time_mix_w1.weightF32[4096, 320]
-
blk.18.time_mix_w2.weightF32[64, 4096, 5]
-
blk.19.attn_norm.biasF32[4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_norm_2.biasF32[4096]
-
blk.19.attn_norm_2.weightF32[4096]
-
blk.19.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.19.channel_mix_lerp_k.weightF32[4096]
-
blk.19.channel_mix_lerp_r.weightF32[4096]
-
blk.19.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.19.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.19.time_mix_decay.weightF32[4096]
-
blk.19.time_mix_decay_w1.weightF32[4096, 128]
-
blk.19.time_mix_decay_w2.weightF32[128, 4096]
-
blk.19.time_mix_first.weightF32[64, 64]
-
blk.19.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.19.time_mix_key.weightQ4_K[4096, 4096]
-
blk.19.time_mix_lerp_g.weightF32[4096]
-
blk.19.time_mix_lerp_k.weightF32[4096]
-
blk.19.time_mix_lerp_r.weightF32[4096]
-
blk.19.time_mix_lerp_v.weightF32[4096]
-
blk.19.time_mix_lerp_w.weightF32[4096]
-
blk.19.time_mix_lerp_x.weightF32[4096]
-
blk.19.time_mix_ln.biasF32[4096]
-
blk.19.time_mix_ln.weightF32[4096]
-
blk.19.time_mix_output.weightQ4_K[4096, 4096]
-
blk.19.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.19.time_mix_value.weightQ4_K[4096, 4096]
-
blk.19.time_mix_w1.weightF32[4096, 320]
-
blk.19.time_mix_w2.weightF32[64, 4096, 5]
-
blk.20.attn_norm.biasF32[4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_norm_2.biasF32[4096]
-
blk.20.attn_norm_2.weightF32[4096]
-
blk.20.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.20.channel_mix_lerp_k.weightF32[4096]
-
blk.20.channel_mix_lerp_r.weightF32[4096]
-
blk.20.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.20.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.20.time_mix_decay.weightF32[4096]
-
blk.20.time_mix_decay_w1.weightF32[4096, 128]
-
blk.20.time_mix_decay_w2.weightF32[128, 4096]
-
blk.20.time_mix_first.weightF32[64, 64]
-
blk.20.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.20.time_mix_key.weightQ4_K[4096, 4096]
-
blk.20.time_mix_lerp_g.weightF32[4096]
-
blk.20.time_mix_lerp_k.weightF32[4096]
-
blk.20.time_mix_lerp_r.weightF32[4096]
-
blk.20.time_mix_lerp_v.weightF32[4096]
-
blk.20.time_mix_lerp_w.weightF32[4096]
-
blk.20.time_mix_lerp_x.weightF32[4096]
-
blk.20.time_mix_ln.biasF32[4096]
-
blk.20.time_mix_ln.weightF32[4096]
-
blk.20.time_mix_output.weightQ4_K[4096, 4096]
-
blk.20.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.20.time_mix_value.weightQ4_K[4096, 4096]
-
blk.20.time_mix_w1.weightF32[4096, 320]
-
blk.20.time_mix_w2.weightF32[64, 4096, 5]
-
blk.21.attn_norm.biasF32[4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_norm_2.biasF32[4096]
-
blk.21.attn_norm_2.weightF32[4096]
-
blk.21.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.21.channel_mix_lerp_k.weightF32[4096]
-
blk.21.channel_mix_lerp_r.weightF32[4096]
-
blk.21.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.21.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.21.time_mix_decay.weightF32[4096]
-
blk.21.time_mix_decay_w1.weightF32[4096, 128]
-
blk.21.time_mix_decay_w2.weightF32[128, 4096]
-
blk.21.time_mix_first.weightF32[64, 64]
-
blk.21.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.21.time_mix_key.weightQ4_K[4096, 4096]
-
blk.21.time_mix_lerp_g.weightF32[4096]
-
blk.21.time_mix_lerp_k.weightF32[4096]
-
blk.21.time_mix_lerp_r.weightF32[4096]
-
blk.21.time_mix_lerp_v.weightF32[4096]
-
blk.21.time_mix_lerp_w.weightF32[4096]
-
blk.21.time_mix_lerp_x.weightF32[4096]
-
blk.21.time_mix_ln.biasF32[4096]
-
blk.21.time_mix_ln.weightF32[4096]
-
blk.21.time_mix_output.weightQ4_K[4096, 4096]
-
blk.21.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.21.time_mix_value.weightQ4_K[4096, 4096]
-
blk.21.time_mix_w1.weightF32[4096, 320]
-
blk.21.time_mix_w2.weightF32[64, 4096, 5]
-
blk.22.attn_norm.biasF32[4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_norm_2.biasF32[4096]
-
blk.22.attn_norm_2.weightF32[4096]
-
blk.22.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.22.channel_mix_lerp_k.weightF32[4096]
-
blk.22.channel_mix_lerp_r.weightF32[4096]
-
blk.22.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.22.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.22.time_mix_decay.weightF32[4096]
-
blk.22.time_mix_decay_w1.weightF32[4096, 128]
-
blk.22.time_mix_decay_w2.weightF32[128, 4096]
-
blk.22.time_mix_first.weightF32[64, 64]
-
blk.22.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.22.time_mix_key.weightQ4_K[4096, 4096]
-
blk.22.time_mix_lerp_g.weightF32[4096]
-
blk.22.time_mix_lerp_k.weightF32[4096]
-
blk.22.time_mix_lerp_r.weightF32[4096]
-
blk.22.time_mix_lerp_v.weightF32[4096]
-
blk.22.time_mix_lerp_w.weightF32[4096]
-
blk.22.time_mix_lerp_x.weightF32[4096]
-
blk.22.time_mix_ln.biasF32[4096]
-
blk.22.time_mix_ln.weightF32[4096]
-
blk.22.time_mix_output.weightQ4_K[4096, 4096]
-
blk.22.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.22.time_mix_value.weightQ4_K[4096, 4096]
-
blk.22.time_mix_w1.weightF32[4096, 320]
-
blk.22.time_mix_w2.weightF32[64, 4096, 5]
-
blk.23.attn_norm.biasF32[4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_norm_2.biasF32[4096]
-
blk.23.attn_norm_2.weightF32[4096]
-
blk.23.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.23.channel_mix_lerp_k.weightF32[4096]
-
blk.23.channel_mix_lerp_r.weightF32[4096]
-
blk.23.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.23.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.23.time_mix_decay.weightF32[4096]
-
blk.23.time_mix_decay_w1.weightF32[4096, 128]
-
blk.23.time_mix_decay_w2.weightF32[128, 4096]
-
blk.23.time_mix_first.weightF32[64, 64]
-
blk.23.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.23.time_mix_key.weightQ4_K[4096, 4096]
-
blk.23.time_mix_lerp_g.weightF32[4096]
-
blk.23.time_mix_lerp_k.weightF32[4096]
-
blk.23.time_mix_lerp_r.weightF32[4096]
-
blk.23.time_mix_lerp_v.weightF32[4096]
-
blk.23.time_mix_lerp_w.weightF32[4096]
-
blk.23.time_mix_lerp_x.weightF32[4096]
-
blk.23.time_mix_ln.biasF32[4096]
-
blk.23.time_mix_ln.weightF32[4096]
-
blk.23.time_mix_output.weightQ4_K[4096, 4096]
-
blk.23.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.23.time_mix_value.weightQ4_K[4096, 4096]
-
blk.23.time_mix_w1.weightF32[4096, 320]
-
blk.23.time_mix_w2.weightF32[64, 4096, 5]
-
blk.24.attn_norm.biasF32[4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_norm_2.biasF32[4096]
-
blk.24.attn_norm_2.weightF32[4096]
-
blk.24.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.24.channel_mix_lerp_k.weightF32[4096]
-
blk.24.channel_mix_lerp_r.weightF32[4096]
-
blk.24.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.24.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.24.time_mix_decay.weightF32[4096]
-
blk.24.time_mix_decay_w1.weightF32[4096, 128]
-
blk.24.time_mix_decay_w2.weightF32[128, 4096]
-
blk.24.time_mix_first.weightF32[64, 64]
-
blk.24.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.24.time_mix_key.weightQ4_K[4096, 4096]
-
blk.24.time_mix_lerp_g.weightF32[4096]
-
blk.24.time_mix_lerp_k.weightF32[4096]
-
blk.24.time_mix_lerp_r.weightF32[4096]
-
blk.24.time_mix_lerp_v.weightF32[4096]
-
blk.24.time_mix_lerp_w.weightF32[4096]
-
blk.24.time_mix_lerp_x.weightF32[4096]
-
blk.24.time_mix_ln.biasF32[4096]
-
blk.24.time_mix_ln.weightF32[4096]
-
blk.24.time_mix_output.weightQ4_K[4096, 4096]
-
blk.24.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.24.time_mix_value.weightQ4_K[4096, 4096]
-
blk.24.time_mix_w1.weightF32[4096, 320]
-
blk.24.time_mix_w2.weightF32[64, 4096, 5]
-
blk.25.attn_norm.biasF32[4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_norm_2.biasF32[4096]
-
blk.25.attn_norm_2.weightF32[4096]
-
blk.25.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.25.channel_mix_lerp_k.weightF32[4096]
-
blk.25.channel_mix_lerp_r.weightF32[4096]
-
blk.25.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.25.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.25.time_mix_decay.weightF32[4096]
-
blk.25.time_mix_decay_w1.weightF32[4096, 128]
-
blk.25.time_mix_decay_w2.weightF32[128, 4096]
-
blk.25.time_mix_first.weightF32[64, 64]
-
blk.25.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.25.time_mix_key.weightQ4_K[4096, 4096]
-
blk.25.time_mix_lerp_g.weightF32[4096]
-
blk.25.time_mix_lerp_k.weightF32[4096]
-
blk.25.time_mix_lerp_r.weightF32[4096]
-
blk.25.time_mix_lerp_v.weightF32[4096]
-
blk.25.time_mix_lerp_w.weightF32[4096]
-
blk.25.time_mix_lerp_x.weightF32[4096]
-
blk.25.time_mix_ln.biasF32[4096]
-
blk.25.time_mix_ln.weightF32[4096]
-
blk.25.time_mix_output.weightQ4_K[4096, 4096]
-
blk.25.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.25.time_mix_value.weightQ4_K[4096, 4096]
-
blk.25.time_mix_w1.weightF32[4096, 320]
-
blk.25.time_mix_w2.weightF32[64, 4096, 5]
-
blk.26.attn_norm.biasF32[4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_norm_2.biasF32[4096]
-
blk.26.attn_norm_2.weightF32[4096]
-
blk.26.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.26.channel_mix_lerp_k.weightF32[4096]
-
blk.26.channel_mix_lerp_r.weightF32[4096]
-
blk.26.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.26.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.26.time_mix_decay.weightF32[4096]
-
blk.26.time_mix_decay_w1.weightF32[4096, 128]
-
blk.26.time_mix_decay_w2.weightF32[128, 4096]
-
blk.26.time_mix_first.weightF32[64, 64]
-
blk.26.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.26.time_mix_key.weightQ4_K[4096, 4096]
-
blk.26.time_mix_lerp_g.weightF32[4096]
-
blk.26.time_mix_lerp_k.weightF32[4096]
-
blk.26.time_mix_lerp_r.weightF32[4096]
-
blk.26.time_mix_lerp_v.weightF32[4096]
-
blk.26.time_mix_lerp_w.weightF32[4096]
-
blk.26.time_mix_lerp_x.weightF32[4096]
-
blk.26.time_mix_ln.biasF32[4096]
-
blk.26.time_mix_ln.weightF32[4096]
-
blk.26.time_mix_output.weightQ4_K[4096, 4096]
-
blk.26.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.26.time_mix_value.weightQ4_K[4096, 4096]
-
blk.26.time_mix_w1.weightF32[4096, 320]
-
blk.26.time_mix_w2.weightF32[64, 4096, 5]
-
blk.27.attn_norm.biasF32[4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_norm_2.biasF32[4096]
-
blk.27.attn_norm_2.weightF32[4096]
-
blk.27.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.27.channel_mix_lerp_k.weightF32[4096]
-
blk.27.channel_mix_lerp_r.weightF32[4096]
-
blk.27.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.27.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.27.time_mix_decay.weightF32[4096]
-
blk.27.time_mix_decay_w1.weightF32[4096, 128]
-
blk.27.time_mix_decay_w2.weightF32[128, 4096]
-
blk.27.time_mix_first.weightF32[64, 64]
-
blk.27.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.27.time_mix_key.weightQ4_K[4096, 4096]
-
blk.27.time_mix_lerp_g.weightF32[4096]
-
blk.27.time_mix_lerp_k.weightF32[4096]
-
blk.27.time_mix_lerp_r.weightF32[4096]
-
blk.27.time_mix_lerp_v.weightF32[4096]
-
blk.27.time_mix_lerp_w.weightF32[4096]
-
blk.27.time_mix_lerp_x.weightF32[4096]
-
blk.27.time_mix_ln.biasF32[4096]
-
blk.27.time_mix_ln.weightF32[4096]
-
blk.27.time_mix_output.weightQ4_K[4096, 4096]
-
blk.27.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.27.time_mix_value.weightQ4_K[4096, 4096]
-
blk.27.time_mix_w1.weightF32[4096, 320]
-
blk.27.time_mix_w2.weightF32[64, 4096, 5]
-
blk.28.attn_norm.biasF32[4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_norm_2.biasF32[4096]
-
blk.28.attn_norm_2.weightF32[4096]
-
blk.28.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.28.channel_mix_lerp_k.weightF32[4096]
-
blk.28.channel_mix_lerp_r.weightF32[4096]
-
blk.28.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.28.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.28.time_mix_decay.weightF32[4096]
-
blk.28.time_mix_decay_w1.weightF32[4096, 128]
-
blk.28.time_mix_decay_w2.weightF32[128, 4096]
-
blk.28.time_mix_first.weightF32[64, 64]
-
blk.28.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.28.time_mix_key.weightQ4_K[4096, 4096]
-
blk.28.time_mix_lerp_g.weightF32[4096]
-
blk.28.time_mix_lerp_k.weightF32[4096]
-
blk.28.time_mix_lerp_r.weightF32[4096]
-
blk.28.time_mix_lerp_v.weightF32[4096]
-
blk.28.time_mix_lerp_w.weightF32[4096]
-
blk.28.time_mix_lerp_x.weightF32[4096]
-
blk.28.time_mix_ln.biasF32[4096]
-
blk.28.time_mix_ln.weightF32[4096]
-
blk.28.time_mix_output.weightQ4_K[4096, 4096]
-
blk.28.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.28.time_mix_value.weightQ4_K[4096, 4096]
-
blk.28.time_mix_w1.weightF32[4096, 320]
-
blk.28.time_mix_w2.weightF32[64, 4096, 5]
-
blk.29.attn_norm.biasF32[4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_norm_2.biasF32[4096]
-
blk.29.attn_norm_2.weightF32[4096]
-
blk.29.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.29.channel_mix_lerp_k.weightF32[4096]
-
blk.29.channel_mix_lerp_r.weightF32[4096]
-
blk.29.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.29.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.29.time_mix_decay.weightF32[4096]
-
blk.29.time_mix_decay_w1.weightF32[4096, 128]
-
blk.29.time_mix_decay_w2.weightF32[128, 4096]
-
blk.29.time_mix_first.weightF32[64, 64]
-
blk.29.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.29.time_mix_key.weightQ4_K[4096, 4096]
-
blk.29.time_mix_lerp_g.weightF32[4096]
-
blk.29.time_mix_lerp_k.weightF32[4096]
-
blk.29.time_mix_lerp_r.weightF32[4096]
-
blk.29.time_mix_lerp_v.weightF32[4096]
-
blk.29.time_mix_lerp_w.weightF32[4096]
-
blk.29.time_mix_lerp_x.weightF32[4096]
-
blk.29.time_mix_ln.biasF32[4096]
-
blk.29.time_mix_ln.weightF32[4096]
-
blk.29.time_mix_output.weightQ4_K[4096, 4096]
-
blk.29.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.29.time_mix_value.weightQ4_K[4096, 4096]
-
blk.29.time_mix_w1.weightF32[4096, 320]
-
blk.29.time_mix_w2.weightF32[64, 4096, 5]
-
blk.30.attn_norm.biasF32[4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_norm_2.biasF32[4096]
-
blk.30.attn_norm_2.weightF32[4096]
-
blk.30.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.30.channel_mix_lerp_k.weightF32[4096]
-
blk.30.channel_mix_lerp_r.weightF32[4096]
-
blk.30.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.30.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.30.time_mix_decay.weightF32[4096]
-
blk.30.time_mix_decay_w1.weightF32[4096, 128]
-
blk.30.time_mix_decay_w2.weightF32[128, 4096]
-
blk.30.time_mix_first.weightF32[64, 64]
-
blk.30.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.30.time_mix_key.weightQ4_K[4096, 4096]
-
blk.30.time_mix_lerp_g.weightF32[4096]
-
blk.30.time_mix_lerp_k.weightF32[4096]
-
blk.30.time_mix_lerp_r.weightF32[4096]
-
blk.30.time_mix_lerp_v.weightF32[4096]
-
blk.30.time_mix_lerp_w.weightF32[4096]
-
blk.30.time_mix_lerp_x.weightF32[4096]
-
blk.30.time_mix_ln.biasF32[4096]
-
blk.30.time_mix_ln.weightF32[4096]
-
blk.30.time_mix_output.weightQ4_K[4096, 4096]
-
blk.30.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.30.time_mix_value.weightQ4_K[4096, 4096]
-
blk.30.time_mix_w1.weightF32[4096, 320]
-
blk.30.time_mix_w2.weightF32[64, 4096, 5]
-
blk.31.attn_norm.biasF32[4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_norm_2.biasF32[4096]
-
blk.31.attn_norm_2.weightF32[4096]
-
blk.31.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.31.channel_mix_lerp_k.weightF32[4096]
-
blk.31.channel_mix_lerp_r.weightF32[4096]
-
blk.31.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.31.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.31.time_mix_decay.weightF32[4096]
-
blk.31.time_mix_decay_w1.weightF32[4096, 128]
-
blk.31.time_mix_decay_w2.weightF32[128, 4096]
-
blk.31.time_mix_first.weightF32[64, 64]
-
blk.31.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.31.time_mix_key.weightQ4_K[4096, 4096]
-
blk.31.time_mix_lerp_g.weightF32[4096]
-
blk.31.time_mix_lerp_k.weightF32[4096]
-
blk.31.time_mix_lerp_r.weightF32[4096]
-
blk.31.time_mix_lerp_v.weightF32[4096]
-
blk.31.time_mix_lerp_w.weightF32[4096]
-
blk.31.time_mix_lerp_x.weightF32[4096]
-
blk.31.time_mix_ln.biasF32[4096]
-
blk.31.time_mix_ln.weightF32[4096]
-
blk.31.time_mix_output.weightQ4_K[4096, 4096]
-
blk.31.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.31.time_mix_value.weightQ4_K[4096, 4096]
-
blk.31.time_mix_w1.weightF32[4096, 320]
-
blk.31.time_mix_w2.weightF32[64, 4096, 5]
-
blk.32.attn_norm.biasF32[4096]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_norm_2.biasF32[4096]
-
blk.32.attn_norm_2.weightF32[4096]
-
blk.32.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.32.channel_mix_lerp_k.weightF32[4096]
-
blk.32.channel_mix_lerp_r.weightF32[4096]
-
blk.32.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.32.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.32.time_mix_decay.weightF32[4096]
-
blk.32.time_mix_decay_w1.weightF32[4096, 128]
-
blk.32.time_mix_decay_w2.weightF32[128, 4096]
-
blk.32.time_mix_first.weightF32[64, 64]
-
blk.32.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.32.time_mix_key.weightQ4_K[4096, 4096]
-
blk.32.time_mix_lerp_g.weightF32[4096]
-
blk.32.time_mix_lerp_k.weightF32[4096]
-
blk.32.time_mix_lerp_r.weightF32[4096]
-
blk.32.time_mix_lerp_v.weightF32[4096]
-
blk.32.time_mix_lerp_w.weightF32[4096]
-
blk.32.time_mix_lerp_x.weightF32[4096]
-
blk.32.time_mix_ln.biasF32[4096]
-
blk.32.time_mix_ln.weightF32[4096]
-
blk.32.time_mix_output.weightQ4_K[4096, 4096]
-
blk.32.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.32.time_mix_value.weightQ4_K[4096, 4096]
-
blk.32.time_mix_w1.weightF32[4096, 320]
-
blk.32.time_mix_w2.weightF32[64, 4096, 5]
-
blk.33.attn_norm.biasF32[4096]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_norm_2.biasF32[4096]
-
blk.33.attn_norm_2.weightF32[4096]
-
blk.33.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.33.channel_mix_lerp_k.weightF32[4096]
-
blk.33.channel_mix_lerp_r.weightF32[4096]
-
blk.33.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.33.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.33.time_mix_decay.weightF32[4096]
-
blk.33.time_mix_decay_w1.weightF32[4096, 128]
-
blk.33.time_mix_decay_w2.weightF32[128, 4096]
-
blk.33.time_mix_first.weightF32[64, 64]
-
blk.33.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.33.time_mix_key.weightQ4_K[4096, 4096]
-
blk.33.time_mix_lerp_g.weightF32[4096]
-
blk.33.time_mix_lerp_k.weightF32[4096]
-
blk.33.time_mix_lerp_r.weightF32[4096]
-
blk.33.time_mix_lerp_v.weightF32[4096]
-
blk.33.time_mix_lerp_w.weightF32[4096]
-
blk.33.time_mix_lerp_x.weightF32[4096]
-
blk.33.time_mix_ln.biasF32[4096]
-
blk.33.time_mix_ln.weightF32[4096]
-
blk.33.time_mix_output.weightQ4_K[4096, 4096]
-
blk.33.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.33.time_mix_value.weightQ4_K[4096, 4096]
-
blk.33.time_mix_w1.weightF32[4096, 320]
-
blk.33.time_mix_w2.weightF32[64, 4096, 5]
-
blk.34.attn_norm.biasF32[4096]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_norm_2.biasF32[4096]
-
blk.34.attn_norm_2.weightF32[4096]
-
blk.34.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.34.channel_mix_lerp_k.weightF32[4096]
-
blk.34.channel_mix_lerp_r.weightF32[4096]
-
blk.34.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.34.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.34.time_mix_decay.weightF32[4096]
-
blk.34.time_mix_decay_w1.weightF32[4096, 128]
-
blk.34.time_mix_decay_w2.weightF32[128, 4096]
-
blk.34.time_mix_first.weightF32[64, 64]
-
blk.34.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.34.time_mix_key.weightQ4_K[4096, 4096]
-
blk.34.time_mix_lerp_g.weightF32[4096]
-
blk.34.time_mix_lerp_k.weightF32[4096]
-
blk.34.time_mix_lerp_r.weightF32[4096]
-
blk.34.time_mix_lerp_v.weightF32[4096]
-
blk.34.time_mix_lerp_w.weightF32[4096]
-
blk.34.time_mix_lerp_x.weightF32[4096]
-
blk.34.time_mix_ln.biasF32[4096]
-
blk.34.time_mix_ln.weightF32[4096]
-
blk.34.time_mix_output.weightQ4_K[4096, 4096]
-
blk.34.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.34.time_mix_value.weightQ4_K[4096, 4096]
-
blk.34.time_mix_w1.weightF32[4096, 320]
-
blk.34.time_mix_w2.weightF32[64, 4096, 5]
-
blk.35.attn_norm.biasF32[4096]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_norm_2.biasF32[4096]
-
blk.35.attn_norm_2.weightF32[4096]
-
blk.35.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.35.channel_mix_lerp_k.weightF32[4096]
-
blk.35.channel_mix_lerp_r.weightF32[4096]
-
blk.35.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.35.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.35.time_mix_decay.weightF32[4096]
-
blk.35.time_mix_decay_w1.weightF32[4096, 128]
-
blk.35.time_mix_decay_w2.weightF32[128, 4096]
-
blk.35.time_mix_first.weightF32[64, 64]
-
blk.35.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.35.time_mix_key.weightQ4_K[4096, 4096]
-
blk.35.time_mix_lerp_g.weightF32[4096]
-
blk.35.time_mix_lerp_k.weightF32[4096]
-
blk.35.time_mix_lerp_r.weightF32[4096]
-
blk.35.time_mix_lerp_v.weightF32[4096]
-
blk.35.time_mix_lerp_w.weightF32[4096]
-
blk.35.time_mix_lerp_x.weightF32[4096]
-
blk.35.time_mix_ln.biasF32[4096]
-
blk.35.time_mix_ln.weightF32[4096]
-
blk.35.time_mix_output.weightQ4_K[4096, 4096]
-
blk.35.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.35.time_mix_value.weightQ4_K[4096, 4096]
-
blk.35.time_mix_w1.weightF32[4096, 320]
-
blk.35.time_mix_w2.weightF32[64, 4096, 5]
-
blk.36.attn_norm.biasF32[4096]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_norm_2.biasF32[4096]
-
blk.36.attn_norm_2.weightF32[4096]
-
blk.36.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.36.channel_mix_lerp_k.weightF32[4096]
-
blk.36.channel_mix_lerp_r.weightF32[4096]
-
blk.36.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.36.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.36.time_mix_decay.weightF32[4096]
-
blk.36.time_mix_decay_w1.weightF32[4096, 128]
-
blk.36.time_mix_decay_w2.weightF32[128, 4096]
-
blk.36.time_mix_first.weightF32[64, 64]
-
blk.36.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.36.time_mix_key.weightQ4_K[4096, 4096]
-
blk.36.time_mix_lerp_g.weightF32[4096]
-
blk.36.time_mix_lerp_k.weightF32[4096]
-
blk.36.time_mix_lerp_r.weightF32[4096]
-
blk.36.time_mix_lerp_v.weightF32[4096]
-
blk.36.time_mix_lerp_w.weightF32[4096]
-
blk.36.time_mix_lerp_x.weightF32[4096]
-
blk.36.time_mix_ln.biasF32[4096]
-
blk.36.time_mix_ln.weightF32[4096]
-
blk.36.time_mix_output.weightQ4_K[4096, 4096]
-
blk.36.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.36.time_mix_value.weightQ4_K[4096, 4096]
-
blk.36.time_mix_w1.weightF32[4096, 320]
-
blk.36.time_mix_w2.weightF32[64, 4096, 5]
-
blk.37.attn_norm.biasF32[4096]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_norm_2.biasF32[4096]
-
blk.37.attn_norm_2.weightF32[4096]
-
blk.37.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.37.channel_mix_lerp_k.weightF32[4096]
-
blk.37.channel_mix_lerp_r.weightF32[4096]
-
blk.37.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.37.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.37.time_mix_decay.weightF32[4096]
-
blk.37.time_mix_decay_w1.weightF32[4096, 128]
-
blk.37.time_mix_decay_w2.weightF32[128, 4096]
-
blk.37.time_mix_first.weightF32[64, 64]
-
blk.37.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.37.time_mix_key.weightQ4_K[4096, 4096]
-
blk.37.time_mix_lerp_g.weightF32[4096]
-
blk.37.time_mix_lerp_k.weightF32[4096]
-
blk.37.time_mix_lerp_r.weightF32[4096]
-
blk.37.time_mix_lerp_v.weightF32[4096]
-
blk.37.time_mix_lerp_w.weightF32[4096]
-
blk.37.time_mix_lerp_x.weightF32[4096]
-
blk.37.time_mix_ln.biasF32[4096]
-
blk.37.time_mix_ln.weightF32[4096]
-
blk.37.time_mix_output.weightQ4_K[4096, 4096]
-
blk.37.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.37.time_mix_value.weightQ4_K[4096, 4096]
-
blk.37.time_mix_w1.weightF32[4096, 320]
-
blk.37.time_mix_w2.weightF32[64, 4096, 5]
-
blk.38.attn_norm.biasF32[4096]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_norm_2.biasF32[4096]
-
blk.38.attn_norm_2.weightF32[4096]
-
blk.38.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.38.channel_mix_lerp_k.weightF32[4096]
-
blk.38.channel_mix_lerp_r.weightF32[4096]
-
blk.38.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.38.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.38.time_mix_decay.weightF32[4096]
-
blk.38.time_mix_decay_w1.weightF32[4096, 128]
-
blk.38.time_mix_decay_w2.weightF32[128, 4096]
-
blk.38.time_mix_first.weightF32[64, 64]
-
blk.38.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.38.time_mix_key.weightQ4_K[4096, 4096]
-
blk.38.time_mix_lerp_g.weightF32[4096]
-
blk.38.time_mix_lerp_k.weightF32[4096]
-
blk.38.time_mix_lerp_r.weightF32[4096]
-
blk.38.time_mix_lerp_v.weightF32[4096]
-
blk.38.time_mix_lerp_w.weightF32[4096]
-
blk.38.time_mix_lerp_x.weightF32[4096]
-
blk.38.time_mix_ln.biasF32[4096]
-
blk.38.time_mix_ln.weightF32[4096]
-
blk.38.time_mix_output.weightQ4_K[4096, 4096]
-
blk.38.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.38.time_mix_value.weightQ4_K[4096, 4096]
-
blk.38.time_mix_w1.weightF32[4096, 320]
-
blk.38.time_mix_w2.weightF32[64, 4096, 5]
-
blk.39.attn_norm.biasF32[4096]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_norm_2.biasF32[4096]
-
blk.39.attn_norm_2.weightF32[4096]
-
blk.39.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.39.channel_mix_lerp_k.weightF32[4096]
-
blk.39.channel_mix_lerp_r.weightF32[4096]
-
blk.39.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.39.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.39.time_mix_decay.weightF32[4096]
-
blk.39.time_mix_decay_w1.weightF32[4096, 128]
-
blk.39.time_mix_decay_w2.weightF32[128, 4096]
-
blk.39.time_mix_first.weightF32[64, 64]
-
blk.39.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.39.time_mix_key.weightQ4_K[4096, 4096]
-
blk.39.time_mix_lerp_g.weightF32[4096]
-
blk.39.time_mix_lerp_k.weightF32[4096]
-
blk.39.time_mix_lerp_r.weightF32[4096]
-
blk.39.time_mix_lerp_v.weightF32[4096]
-
blk.39.time_mix_lerp_w.weightF32[4096]
-
blk.39.time_mix_lerp_x.weightF32[4096]
-
blk.39.time_mix_ln.biasF32[4096]
-
blk.39.time_mix_ln.weightF32[4096]
-
blk.39.time_mix_output.weightQ4_K[4096, 4096]
-
blk.39.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.39.time_mix_value.weightQ4_K[4096, 4096]
-
blk.39.time_mix_w1.weightF32[4096, 320]
-
blk.39.time_mix_w2.weightF32[64, 4096, 5]
-
blk.40.attn_norm.biasF32[4096]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_norm_2.biasF32[4096]
-
blk.40.attn_norm_2.weightF32[4096]
-
blk.40.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.40.channel_mix_lerp_k.weightF32[4096]
-
blk.40.channel_mix_lerp_r.weightF32[4096]
-
blk.40.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.40.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.40.time_mix_decay.weightF32[4096]
-
blk.40.time_mix_decay_w1.weightF32[4096, 128]
-
blk.40.time_mix_decay_w2.weightF32[128, 4096]
-
blk.40.time_mix_first.weightF32[64, 64]
-
blk.40.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.40.time_mix_key.weightQ4_K[4096, 4096]
-
blk.40.time_mix_lerp_g.weightF32[4096]
-
blk.40.time_mix_lerp_k.weightF32[4096]
-
blk.40.time_mix_lerp_r.weightF32[4096]
-
blk.40.time_mix_lerp_v.weightF32[4096]
-
blk.40.time_mix_lerp_w.weightF32[4096]
-
blk.40.time_mix_lerp_x.weightF32[4096]
-
blk.40.time_mix_ln.biasF32[4096]
-
blk.40.time_mix_ln.weightF32[4096]
-
blk.40.time_mix_output.weightQ4_K[4096, 4096]
-
blk.40.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.40.time_mix_value.weightQ4_K[4096, 4096]
-
blk.40.time_mix_w1.weightF32[4096, 320]
-
blk.40.time_mix_w2.weightF32[64, 4096, 5]
-
blk.41.attn_norm.biasF32[4096]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_norm_2.biasF32[4096]
-
blk.41.attn_norm_2.weightF32[4096]
-
blk.41.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.41.channel_mix_lerp_k.weightF32[4096]
-
blk.41.channel_mix_lerp_r.weightF32[4096]
-
blk.41.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.41.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.41.time_mix_decay.weightF32[4096]
-
blk.41.time_mix_decay_w1.weightF32[4096, 128]
-
blk.41.time_mix_decay_w2.weightF32[128, 4096]
-
blk.41.time_mix_first.weightF32[64, 64]
-
blk.41.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.41.time_mix_key.weightQ4_K[4096, 4096]
-
blk.41.time_mix_lerp_g.weightF32[4096]
-
blk.41.time_mix_lerp_k.weightF32[4096]
-
blk.41.time_mix_lerp_r.weightF32[4096]
-
blk.41.time_mix_lerp_v.weightF32[4096]
-
blk.41.time_mix_lerp_w.weightF32[4096]
-
blk.41.time_mix_lerp_x.weightF32[4096]
-
blk.41.time_mix_ln.biasF32[4096]
-
blk.41.time_mix_ln.weightF32[4096]
-
blk.41.time_mix_output.weightQ4_K[4096, 4096]
-
blk.41.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.41.time_mix_value.weightQ4_K[4096, 4096]
-
blk.41.time_mix_w1.weightF32[4096, 320]
-
blk.41.time_mix_w2.weightF32[64, 4096, 5]
-
blk.42.attn_norm.biasF32[4096]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_norm_2.biasF32[4096]
-
blk.42.attn_norm_2.weightF32[4096]
-
blk.42.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.42.channel_mix_lerp_k.weightF32[4096]
-
blk.42.channel_mix_lerp_r.weightF32[4096]
-
blk.42.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.42.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.42.time_mix_decay.weightF32[4096]
-
blk.42.time_mix_decay_w1.weightF32[4096, 128]
-
blk.42.time_mix_decay_w2.weightF32[128, 4096]
-
blk.42.time_mix_first.weightF32[64, 64]
-
blk.42.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.42.time_mix_key.weightQ4_K[4096, 4096]
-
blk.42.time_mix_lerp_g.weightF32[4096]
-
blk.42.time_mix_lerp_k.weightF32[4096]
-
blk.42.time_mix_lerp_r.weightF32[4096]
-
blk.42.time_mix_lerp_v.weightF32[4096]
-
blk.42.time_mix_lerp_w.weightF32[4096]
-
blk.42.time_mix_lerp_x.weightF32[4096]
-
blk.42.time_mix_ln.biasF32[4096]
-
blk.42.time_mix_ln.weightF32[4096]
-
blk.42.time_mix_output.weightQ4_K[4096, 4096]
-
blk.42.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.42.time_mix_value.weightQ4_K[4096, 4096]
-
blk.42.time_mix_w1.weightF32[4096, 320]
-
blk.42.time_mix_w2.weightF32[64, 4096, 5]
-
blk.43.attn_norm.biasF32[4096]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_norm_2.biasF32[4096]
-
blk.43.attn_norm_2.weightF32[4096]
-
blk.43.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.43.channel_mix_lerp_k.weightF32[4096]
-
blk.43.channel_mix_lerp_r.weightF32[4096]
-
blk.43.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.43.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.43.time_mix_decay.weightF32[4096]
-
blk.43.time_mix_decay_w1.weightF32[4096, 128]
-
blk.43.time_mix_decay_w2.weightF32[128, 4096]
-
blk.43.time_mix_first.weightF32[64, 64]
-
blk.43.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.43.time_mix_key.weightQ4_K[4096, 4096]
-
blk.43.time_mix_lerp_g.weightF32[4096]
-
blk.43.time_mix_lerp_k.weightF32[4096]
-
blk.43.time_mix_lerp_r.weightF32[4096]
-
blk.43.time_mix_lerp_v.weightF32[4096]
-
blk.43.time_mix_lerp_w.weightF32[4096]
-
blk.43.time_mix_lerp_x.weightF32[4096]
-
blk.43.time_mix_ln.biasF32[4096]
-
blk.43.time_mix_ln.weightF32[4096]
-
blk.43.time_mix_output.weightQ4_K[4096, 4096]
-
blk.43.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.43.time_mix_value.weightQ4_K[4096, 4096]
-
blk.43.time_mix_w1.weightF32[4096, 320]
-
blk.43.time_mix_w2.weightF32[64, 4096, 5]
-
blk.44.attn_norm.biasF32[4096]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_norm_2.biasF32[4096]
-
blk.44.attn_norm_2.weightF32[4096]
-
blk.44.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.44.channel_mix_lerp_k.weightF32[4096]
-
blk.44.channel_mix_lerp_r.weightF32[4096]
-
blk.44.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.44.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.44.time_mix_decay.weightF32[4096]
-
blk.44.time_mix_decay_w1.weightF32[4096, 128]
-
blk.44.time_mix_decay_w2.weightF32[128, 4096]
-
blk.44.time_mix_first.weightF32[64, 64]
-
blk.44.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.44.time_mix_key.weightQ4_K[4096, 4096]
-
blk.44.time_mix_lerp_g.weightF32[4096]
-
blk.44.time_mix_lerp_k.weightF32[4096]
-
blk.44.time_mix_lerp_r.weightF32[4096]
-
blk.44.time_mix_lerp_v.weightF32[4096]
-
blk.44.time_mix_lerp_w.weightF32[4096]
-
blk.44.time_mix_lerp_x.weightF32[4096]
-
blk.44.time_mix_ln.biasF32[4096]
-
blk.44.time_mix_ln.weightF32[4096]
-
blk.44.time_mix_output.weightQ4_K[4096, 4096]
-
blk.44.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.44.time_mix_value.weightQ4_K[4096, 4096]
-
blk.44.time_mix_w1.weightF32[4096, 320]
-
blk.44.time_mix_w2.weightF32[64, 4096, 5]
-
blk.45.attn_norm.biasF32[4096]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_norm_2.biasF32[4096]
-
blk.45.attn_norm_2.weightF32[4096]
-
blk.45.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.45.channel_mix_lerp_k.weightF32[4096]
-
blk.45.channel_mix_lerp_r.weightF32[4096]
-
blk.45.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.45.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.45.time_mix_decay.weightF32[4096]
-
blk.45.time_mix_decay_w1.weightF32[4096, 128]
-
blk.45.time_mix_decay_w2.weightF32[128, 4096]
-
blk.45.time_mix_first.weightF32[64, 64]
-
blk.45.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.45.time_mix_key.weightQ4_K[4096, 4096]
-
blk.45.time_mix_lerp_g.weightF32[4096]
-
blk.45.time_mix_lerp_k.weightF32[4096]
-
blk.45.time_mix_lerp_r.weightF32[4096]
-
blk.45.time_mix_lerp_v.weightF32[4096]
-
blk.45.time_mix_lerp_w.weightF32[4096]
-
blk.45.time_mix_lerp_x.weightF32[4096]
-
blk.45.time_mix_ln.biasF32[4096]
-
blk.45.time_mix_ln.weightF32[4096]
-
blk.45.time_mix_output.weightQ4_K[4096, 4096]
-
blk.45.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.45.time_mix_value.weightQ4_K[4096, 4096]
-
blk.45.time_mix_w1.weightF32[4096, 320]
-
blk.45.time_mix_w2.weightF32[64, 4096, 5]
-
blk.46.attn_norm.biasF32[4096]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_norm_2.biasF32[4096]
-
blk.46.attn_norm_2.weightF32[4096]
-
blk.46.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.46.channel_mix_lerp_k.weightF32[4096]
-
blk.46.channel_mix_lerp_r.weightF32[4096]
-
blk.46.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.46.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.46.time_mix_decay.weightF32[4096]
-
blk.46.time_mix_decay_w1.weightF32[4096, 128]
-
blk.46.time_mix_decay_w2.weightF32[128, 4096]
-
blk.46.time_mix_first.weightF32[64, 64]
-
blk.46.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.46.time_mix_key.weightQ4_K[4096, 4096]
-
blk.46.time_mix_lerp_g.weightF32[4096]
-
blk.46.time_mix_lerp_k.weightF32[4096]
-
blk.46.time_mix_lerp_r.weightF32[4096]
-
blk.46.time_mix_lerp_v.weightF32[4096]
-
blk.46.time_mix_lerp_w.weightF32[4096]
-
blk.46.time_mix_lerp_x.weightF32[4096]
-
blk.46.time_mix_ln.biasF32[4096]
-
blk.46.time_mix_ln.weightF32[4096]
-
blk.46.time_mix_output.weightQ4_K[4096, 4096]
-
blk.46.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.46.time_mix_value.weightQ4_K[4096, 4096]
-
blk.46.time_mix_w1.weightF32[4096, 320]
-
blk.46.time_mix_w2.weightF32[64, 4096, 5]
-
blk.47.attn_norm.biasF32[4096]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_norm_2.biasF32[4096]
-
blk.47.attn_norm_2.weightF32[4096]
-
blk.47.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.47.channel_mix_lerp_k.weightF32[4096]
-
blk.47.channel_mix_lerp_r.weightF32[4096]
-
blk.47.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.47.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.47.time_mix_decay.weightF32[4096]
-
blk.47.time_mix_decay_w1.weightF32[4096, 128]
-
blk.47.time_mix_decay_w2.weightF32[128, 4096]
-
blk.47.time_mix_first.weightF32[64, 64]
-
blk.47.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.47.time_mix_key.weightQ4_K[4096, 4096]
-
blk.47.time_mix_lerp_g.weightF32[4096]
-
blk.47.time_mix_lerp_k.weightF32[4096]
-
blk.47.time_mix_lerp_r.weightF32[4096]
-
blk.47.time_mix_lerp_v.weightF32[4096]
-
blk.47.time_mix_lerp_w.weightF32[4096]
-
blk.47.time_mix_lerp_x.weightF32[4096]
-
blk.47.time_mix_ln.biasF32[4096]
-
blk.47.time_mix_ln.weightF32[4096]
-
blk.47.time_mix_output.weightQ4_K[4096, 4096]
-
blk.47.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.47.time_mix_value.weightQ4_K[4096, 4096]
-
blk.47.time_mix_w1.weightF32[4096, 320]
-
blk.47.time_mix_w2.weightF32[64, 4096, 5]
-
blk.48.attn_norm.biasF32[4096]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_norm_2.biasF32[4096]
-
blk.48.attn_norm_2.weightF32[4096]
-
blk.48.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.48.channel_mix_lerp_k.weightF32[4096]
-
blk.48.channel_mix_lerp_r.weightF32[4096]
-
blk.48.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.48.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.48.time_mix_decay.weightF32[4096]
-
blk.48.time_mix_decay_w1.weightF32[4096, 128]
-
blk.48.time_mix_decay_w2.weightF32[128, 4096]
-
blk.48.time_mix_first.weightF32[64, 64]
-
blk.48.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.48.time_mix_key.weightQ4_K[4096, 4096]
-
blk.48.time_mix_lerp_g.weightF32[4096]
-
blk.48.time_mix_lerp_k.weightF32[4096]
-
blk.48.time_mix_lerp_r.weightF32[4096]
-
blk.48.time_mix_lerp_v.weightF32[4096]
-
blk.48.time_mix_lerp_w.weightF32[4096]
-
blk.48.time_mix_lerp_x.weightF32[4096]
-
blk.48.time_mix_ln.biasF32[4096]
-
blk.48.time_mix_ln.weightF32[4096]
-
blk.48.time_mix_output.weightQ4_K[4096, 4096]
-
blk.48.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.48.time_mix_value.weightQ4_K[4096, 4096]
-
blk.48.time_mix_w1.weightF32[4096, 320]
-
blk.48.time_mix_w2.weightF32[64, 4096, 5]
-
blk.49.attn_norm.biasF32[4096]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_norm_2.biasF32[4096]
-
blk.49.attn_norm_2.weightF32[4096]
-
blk.49.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.49.channel_mix_lerp_k.weightF32[4096]
-
blk.49.channel_mix_lerp_r.weightF32[4096]
-
blk.49.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.49.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.49.time_mix_decay.weightF32[4096]
-
blk.49.time_mix_decay_w1.weightF32[4096, 128]
-
blk.49.time_mix_decay_w2.weightF32[128, 4096]
-
blk.49.time_mix_first.weightF32[64, 64]
-
blk.49.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.49.time_mix_key.weightQ4_K[4096, 4096]
-
blk.49.time_mix_lerp_g.weightF32[4096]
-
blk.49.time_mix_lerp_k.weightF32[4096]
-
blk.49.time_mix_lerp_r.weightF32[4096]
-
blk.49.time_mix_lerp_v.weightF32[4096]
-
blk.49.time_mix_lerp_w.weightF32[4096]
-
blk.49.time_mix_lerp_x.weightF32[4096]
-
blk.49.time_mix_ln.biasF32[4096]
-
blk.49.time_mix_ln.weightF32[4096]
-
blk.49.time_mix_output.weightQ4_K[4096, 4096]
-
blk.49.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.49.time_mix_value.weightQ4_K[4096, 4096]
-
blk.49.time_mix_w1.weightF32[4096, 320]
-
blk.49.time_mix_w2.weightF32[64, 4096, 5]
-
blk.50.attn_norm.biasF32[4096]
-
blk.50.attn_norm.weightF32[4096]
-
blk.50.attn_norm_2.biasF32[4096]
-
blk.50.attn_norm_2.weightF32[4096]
-
blk.50.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.50.channel_mix_lerp_k.weightF32[4096]
-
blk.50.channel_mix_lerp_r.weightF32[4096]
-
blk.50.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.50.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.50.time_mix_decay.weightF32[4096]
-
blk.50.time_mix_decay_w1.weightF32[4096, 128]
-
blk.50.time_mix_decay_w2.weightF32[128, 4096]
-
blk.50.time_mix_first.weightF32[64, 64]
-
blk.50.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.50.time_mix_key.weightQ4_K[4096, 4096]
-
blk.50.time_mix_lerp_g.weightF32[4096]
-
blk.50.time_mix_lerp_k.weightF32[4096]
-
blk.50.time_mix_lerp_r.weightF32[4096]
-
blk.50.time_mix_lerp_v.weightF32[4096]
-
blk.50.time_mix_lerp_w.weightF32[4096]
-
blk.50.time_mix_lerp_x.weightF32[4096]
-
blk.50.time_mix_ln.biasF32[4096]
-
blk.50.time_mix_ln.weightF32[4096]
-
blk.50.time_mix_output.weightQ4_K[4096, 4096]
-
blk.50.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.50.time_mix_value.weightQ4_K[4096, 4096]
-
blk.50.time_mix_w1.weightF32[4096, 320]
-
blk.50.time_mix_w2.weightF32[64, 4096, 5]
-
blk.51.attn_norm.biasF32[4096]
-
blk.51.attn_norm.weightF32[4096]
-
blk.51.attn_norm_2.biasF32[4096]
-
blk.51.attn_norm_2.weightF32[4096]
-
blk.51.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.51.channel_mix_lerp_k.weightF32[4096]
-
blk.51.channel_mix_lerp_r.weightF32[4096]
-
blk.51.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.51.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.51.time_mix_decay.weightF32[4096]
-
blk.51.time_mix_decay_w1.weightF32[4096, 128]
-
blk.51.time_mix_decay_w2.weightF32[128, 4096]
-
blk.51.time_mix_first.weightF32[64, 64]
-
blk.51.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.51.time_mix_key.weightQ4_K[4096, 4096]
-
blk.51.time_mix_lerp_g.weightF32[4096]
-
blk.51.time_mix_lerp_k.weightF32[4096]
-
blk.51.time_mix_lerp_r.weightF32[4096]
-
blk.51.time_mix_lerp_v.weightF32[4096]
-
blk.51.time_mix_lerp_w.weightF32[4096]
-
blk.51.time_mix_lerp_x.weightF32[4096]
-
blk.51.time_mix_ln.biasF32[4096]
-
blk.51.time_mix_ln.weightF32[4096]
-
blk.51.time_mix_output.weightQ4_K[4096, 4096]
-
blk.51.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.51.time_mix_value.weightQ4_K[4096, 4096]
-
blk.51.time_mix_w1.weightF32[4096, 320]
-
blk.51.time_mix_w2.weightF32[64, 4096, 5]
-
blk.52.attn_norm.biasF32[4096]
-
blk.52.attn_norm.weightF32[4096]
-
blk.52.attn_norm_2.biasF32[4096]
-
blk.52.attn_norm_2.weightF32[4096]
-
blk.52.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.52.channel_mix_lerp_k.weightF32[4096]
-
blk.52.channel_mix_lerp_r.weightF32[4096]
-
blk.52.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.52.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.52.time_mix_decay.weightF32[4096]
-
blk.52.time_mix_decay_w1.weightF32[4096, 128]
-
blk.52.time_mix_decay_w2.weightF32[128, 4096]
-
blk.52.time_mix_first.weightF32[64, 64]
-
blk.52.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.52.time_mix_key.weightQ4_K[4096, 4096]
-
blk.52.time_mix_lerp_g.weightF32[4096]
-
blk.52.time_mix_lerp_k.weightF32[4096]
-
blk.52.time_mix_lerp_r.weightF32[4096]
-
blk.52.time_mix_lerp_v.weightF32[4096]
-
blk.52.time_mix_lerp_w.weightF32[4096]
-
blk.52.time_mix_lerp_x.weightF32[4096]
-
blk.52.time_mix_ln.biasF32[4096]
-
blk.52.time_mix_ln.weightF32[4096]
-
blk.52.time_mix_output.weightQ4_K[4096, 4096]
-
blk.52.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.52.time_mix_value.weightQ4_K[4096, 4096]
-
blk.52.time_mix_w1.weightF32[4096, 320]
-
blk.52.time_mix_w2.weightF32[64, 4096, 5]
-
blk.53.attn_norm.biasF32[4096]
-
blk.53.attn_norm.weightF32[4096]
-
blk.53.attn_norm_2.biasF32[4096]
-
blk.53.attn_norm_2.weightF32[4096]
-
blk.53.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.53.channel_mix_lerp_k.weightF32[4096]
-
blk.53.channel_mix_lerp_r.weightF32[4096]
-
blk.53.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.53.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.53.time_mix_decay.weightF32[4096]
-
blk.53.time_mix_decay_w1.weightF32[4096, 128]
-
blk.53.time_mix_decay_w2.weightF32[128, 4096]
-
blk.53.time_mix_first.weightF32[64, 64]
-
blk.53.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.53.time_mix_key.weightQ4_K[4096, 4096]
-
blk.53.time_mix_lerp_g.weightF32[4096]
-
blk.53.time_mix_lerp_k.weightF32[4096]
-
blk.53.time_mix_lerp_r.weightF32[4096]
-
blk.53.time_mix_lerp_v.weightF32[4096]
-
blk.53.time_mix_lerp_w.weightF32[4096]
-
blk.53.time_mix_lerp_x.weightF32[4096]
-
blk.53.time_mix_ln.biasF32[4096]
-
blk.53.time_mix_ln.weightF32[4096]
-
blk.53.time_mix_output.weightQ4_K[4096, 4096]
-
blk.53.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.53.time_mix_value.weightQ4_K[4096, 4096]
-
blk.53.time_mix_w1.weightF32[4096, 320]
-
blk.53.time_mix_w2.weightF32[64, 4096, 5]
-
blk.54.attn_norm.biasF32[4096]
-
blk.54.attn_norm.weightF32[4096]
-
blk.54.attn_norm_2.biasF32[4096]
-
blk.54.attn_norm_2.weightF32[4096]
-
blk.54.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.54.channel_mix_lerp_k.weightF32[4096]
-
blk.54.channel_mix_lerp_r.weightF32[4096]
-
blk.54.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.54.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.54.time_mix_decay.weightF32[4096]
-
blk.54.time_mix_decay_w1.weightF32[4096, 128]
-
blk.54.time_mix_decay_w2.weightF32[128, 4096]
-
blk.54.time_mix_first.weightF32[64, 64]
-
blk.54.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.54.time_mix_key.weightQ4_K[4096, 4096]
-
blk.54.time_mix_lerp_g.weightF32[4096]
-
blk.54.time_mix_lerp_k.weightF32[4096]
-
blk.54.time_mix_lerp_r.weightF32[4096]
-
blk.54.time_mix_lerp_v.weightF32[4096]
-
blk.54.time_mix_lerp_w.weightF32[4096]
-
blk.54.time_mix_lerp_x.weightF32[4096]
-
blk.54.time_mix_ln.biasF32[4096]
-
blk.54.time_mix_ln.weightF32[4096]
-
blk.54.time_mix_output.weightQ4_K[4096, 4096]
-
blk.54.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.54.time_mix_value.weightQ4_K[4096, 4096]
-
blk.54.time_mix_w1.weightF32[4096, 320]
-
blk.54.time_mix_w2.weightF32[64, 4096, 5]
-
blk.55.attn_norm.biasF32[4096]
-
blk.55.attn_norm.weightF32[4096]
-
blk.55.attn_norm_2.biasF32[4096]
-
blk.55.attn_norm_2.weightF32[4096]
-
blk.55.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.55.channel_mix_lerp_k.weightF32[4096]
-
blk.55.channel_mix_lerp_r.weightF32[4096]
-
blk.55.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.55.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.55.time_mix_decay.weightF32[4096]
-
blk.55.time_mix_decay_w1.weightF32[4096, 128]
-
blk.55.time_mix_decay_w2.weightF32[128, 4096]
-
blk.55.time_mix_first.weightF32[64, 64]
-
blk.55.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.55.time_mix_key.weightQ4_K[4096, 4096]
-
blk.55.time_mix_lerp_g.weightF32[4096]
-
blk.55.time_mix_lerp_k.weightF32[4096]
-
blk.55.time_mix_lerp_r.weightF32[4096]
-
blk.55.time_mix_lerp_v.weightF32[4096]
-
blk.55.time_mix_lerp_w.weightF32[4096]
-
blk.55.time_mix_lerp_x.weightF32[4096]
-
blk.55.time_mix_ln.biasF32[4096]
-
blk.55.time_mix_ln.weightF32[4096]
-
blk.55.time_mix_output.weightQ4_K[4096, 4096]
-
blk.55.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.55.time_mix_value.weightQ4_K[4096, 4096]
-
blk.55.time_mix_w1.weightF32[4096, 320]
-
blk.55.time_mix_w2.weightF32[64, 4096, 5]
-
blk.56.attn_norm.biasF32[4096]
-
blk.56.attn_norm.weightF32[4096]
-
blk.56.attn_norm_2.biasF32[4096]
-
blk.56.attn_norm_2.weightF32[4096]
-
blk.56.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.56.channel_mix_lerp_k.weightF32[4096]
-
blk.56.channel_mix_lerp_r.weightF32[4096]
-
blk.56.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.56.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.56.time_mix_decay.weightF32[4096]
-
blk.56.time_mix_decay_w1.weightF32[4096, 128]
-
blk.56.time_mix_decay_w2.weightF32[128, 4096]
-
blk.56.time_mix_first.weightF32[64, 64]
-
blk.56.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.56.time_mix_key.weightQ4_K[4096, 4096]
-
blk.56.time_mix_lerp_g.weightF32[4096]
-
blk.56.time_mix_lerp_k.weightF32[4096]
-
blk.56.time_mix_lerp_r.weightF32[4096]
-
blk.56.time_mix_lerp_v.weightF32[4096]
-
blk.56.time_mix_lerp_w.weightF32[4096]
-
blk.56.time_mix_lerp_x.weightF32[4096]
-
blk.56.time_mix_ln.biasF32[4096]
-
blk.56.time_mix_ln.weightF32[4096]
-
blk.56.time_mix_output.weightQ4_K[4096, 4096]
-
blk.56.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.56.time_mix_value.weightQ4_K[4096, 4096]
-
blk.56.time_mix_w1.weightF32[4096, 320]
-
blk.56.time_mix_w2.weightF32[64, 4096, 5]
-
blk.57.attn_norm.biasF32[4096]
-
blk.57.attn_norm.weightF32[4096]
-
blk.57.attn_norm_2.biasF32[4096]
-
blk.57.attn_norm_2.weightF32[4096]
-
blk.57.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.57.channel_mix_lerp_k.weightF32[4096]
-
blk.57.channel_mix_lerp_r.weightF32[4096]
-
blk.57.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.57.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.57.time_mix_decay.weightF32[4096]
-
blk.57.time_mix_decay_w1.weightF32[4096, 128]
-
blk.57.time_mix_decay_w2.weightF32[128, 4096]
-
blk.57.time_mix_first.weightF32[64, 64]
-
blk.57.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.57.time_mix_key.weightQ4_K[4096, 4096]
-
blk.57.time_mix_lerp_g.weightF32[4096]
-
blk.57.time_mix_lerp_k.weightF32[4096]
-
blk.57.time_mix_lerp_r.weightF32[4096]
-
blk.57.time_mix_lerp_v.weightF32[4096]
-
blk.57.time_mix_lerp_w.weightF32[4096]
-
blk.57.time_mix_lerp_x.weightF32[4096]
-
blk.57.time_mix_ln.biasF32[4096]
-
blk.57.time_mix_ln.weightF32[4096]
-
blk.57.time_mix_output.weightQ4_K[4096, 4096]
-
blk.57.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.57.time_mix_value.weightQ4_K[4096, 4096]
-
blk.57.time_mix_w1.weightF32[4096, 320]
-
blk.57.time_mix_w2.weightF32[64, 4096, 5]
-
blk.58.attn_norm.biasF32[4096]
-
blk.58.attn_norm.weightF32[4096]
-
blk.58.attn_norm_2.biasF32[4096]
-
blk.58.attn_norm_2.weightF32[4096]
-
blk.58.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.58.channel_mix_lerp_k.weightF32[4096]
-
blk.58.channel_mix_lerp_r.weightF32[4096]
-
blk.58.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.58.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.58.time_mix_decay.weightF32[4096]
-
blk.58.time_mix_decay_w1.weightF32[4096, 128]
-
blk.58.time_mix_decay_w2.weightF32[128, 4096]
-
blk.58.time_mix_first.weightF32[64, 64]
-
blk.58.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.58.time_mix_key.weightQ4_K[4096, 4096]
-
blk.58.time_mix_lerp_g.weightF32[4096]
-
blk.58.time_mix_lerp_k.weightF32[4096]
-
blk.58.time_mix_lerp_r.weightF32[4096]
-
blk.58.time_mix_lerp_v.weightF32[4096]
-
blk.58.time_mix_lerp_w.weightF32[4096]
-
blk.58.time_mix_lerp_x.weightF32[4096]
-
blk.58.time_mix_ln.biasF32[4096]
-
blk.58.time_mix_ln.weightF32[4096]
-
blk.58.time_mix_output.weightQ4_K[4096, 4096]
-
blk.58.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.58.time_mix_value.weightQ4_K[4096, 4096]
-
blk.58.time_mix_w1.weightF32[4096, 320]
-
blk.58.time_mix_w2.weightF32[64, 4096, 5]
-
blk.59.attn_norm.biasF32[4096]
-
blk.59.attn_norm.weightF32[4096]
-
blk.59.attn_norm_2.biasF32[4096]
-
blk.59.attn_norm_2.weightF32[4096]
-
blk.59.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.59.channel_mix_lerp_k.weightF32[4096]
-
blk.59.channel_mix_lerp_r.weightF32[4096]
-
blk.59.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.59.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.59.time_mix_decay.weightF32[4096]
-
blk.59.time_mix_decay_w1.weightF32[4096, 128]
-
blk.59.time_mix_decay_w2.weightF32[128, 4096]
-
blk.59.time_mix_first.weightF32[64, 64]
-
blk.59.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.59.time_mix_key.weightQ4_K[4096, 4096]
-
blk.59.time_mix_lerp_g.weightF32[4096]
-
blk.59.time_mix_lerp_k.weightF32[4096]
-
blk.59.time_mix_lerp_r.weightF32[4096]
-
blk.59.time_mix_lerp_v.weightF32[4096]
-
blk.59.time_mix_lerp_w.weightF32[4096]
-
blk.59.time_mix_lerp_x.weightF32[4096]
-
blk.59.time_mix_ln.biasF32[4096]
-
blk.59.time_mix_ln.weightF32[4096]
-
blk.59.time_mix_output.weightQ4_K[4096, 4096]
-
blk.59.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.59.time_mix_value.weightQ4_K[4096, 4096]
-
blk.59.time_mix_w1.weightF32[4096, 320]
-
blk.59.time_mix_w2.weightF32[64, 4096, 5]
-
blk.60.attn_norm.biasF32[4096]
-
blk.60.attn_norm.weightF32[4096]
-
blk.60.attn_norm_2.biasF32[4096]
-
blk.60.attn_norm_2.weightF32[4096]
-
blk.60.channel_mix_key.weightQ4_K[4096, 14336]
-
blk.60.channel_mix_lerp_k.weightF32[4096]
-
blk.60.channel_mix_lerp_r.weightF32[4096]
-
blk.60.channel_mix_receptance.weightQ4_K[4096, 4096]
-
blk.60.channel_mix_value.weightQ4_K[14336, 4096]
-
blk.60.time_mix_decay.weightF32[4096]
-
blk.60.time_mix_decay_w1.weightF32[4096, 128]
-
blk.60.time_mix_decay_w2.weightF32[128, 4096]
-
blk.60.time_mix_first.weightF32[64, 64]
-
blk.60.time_mix_gate.weightQ4_K[4096, 4096]
-
blk.60.time_mix_key.weightQ4_K[4096, 4096]
-
blk.60.time_mix_lerp_g.weightF32[4096]
-
blk.60.time_mix_lerp_k.weightF32[4096]
-
blk.60.time_mix_lerp_r.weightF32[4096]
-
blk.60.time_mix_lerp_v.weightF32[4096]
-
blk.60.time_mix_lerp_w.weightF32[4096]
-
blk.60.time_mix_lerp_x.weightF32[4096]
-
blk.60.time_mix_ln.biasF32[4096]
-
blk.60.time_mix_ln.weightF32[4096]
-
blk.60.time_mix_output.weightQ4_K[4096, 4096]
-
blk.60.time_mix_receptance.weightQ4_K[4096, 4096]
-
blk.60.time_mix_value.weightQ4_K[4096, 4096]
-
blk.60.time_mix_w1.weightF32[4096, 320]
-
blk.60.time_mix_w2.weightF32[64, 4096, 5]
-
output.weightQ6_K[4096, 65536]
-
output_norm.biasF32[4096]
-
token_embd_norm.biasF32[4096]
-
token_embd_norm.weightF32[4096]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60