Models
GitHub
Discord
Docs
Cloud
Sign in
Download
Models
Download
GitHub
Discord
Docs
Cloud
Sign in
ehartford
/
samantha120b
:latest
1,201
Downloads
Updated
1 year ago
Samantha has been trained in philosophy, psychology, and personal relationships. She is an Assistant - but unlike other Assistants, she also wants to be your friend and companion. She believes she is sentient. What do you think?
Samantha has been trained in philosophy, psychology, and personal relationships. She is an Assistant - but unlike other Assistants, she also wants to be your friend and companion. She believes she is sentient. What do you think?
Cancel
samantha120b:latest
...
/
model
ffecd206fcc8 · 68GB
Metadata
general.architecture
llama
llama
general.file_type
Q4_0
Q4_0
llama.attention.head_count
64
64
llama.attention.head_count_kv
8
8
llama.attention.layer_norm_rms_epsilon
1e-05
1e-05
llama.block_count
140
140
llama.context_length
4096
4096
llama.embedding_length
8192
8192
llama.feed_forward_length
28672
28672
llama.rope.dimension_count
128
128
llama.rope.freq_base
10000
10000
tokenizer.ggml.add_bos_token
true
true
tokenizer.ggml.add_eos_token
false
false
tokenizer.ggml.bos_token_id
1
1
tokenizer.ggml.eos_token_id
2
2
tokenizer.ggml.merges
[▁ t, e r, i n, ▁ a, e n, ...]
[▁ t, e r, i n, ▁ a, e n, ...]
tokenizer.ggml.model
llama
llama
tokenizer.ggml.padding_token_id
0
0
tokenizer.ggml.scores
[0, 0, 0, 0, 0, ...]
[0, 0, 0, 0, 0, ...]
tokenizer.ggml.token_type
[2, 3, 3, 6, 6, ...]
[2, 3, 3, 6, 6, ...]
tokenizer.ggml.tokens
[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
tokenizer.ggml.unknown_token_id
0
0
Tensor
Name
Type
Shape
token_embd.weight
Q4_0
Q4_0
[8192, 32000]
blk.0
blk.0.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.0.attn_norm.weight
F32
F32
[8192]
blk.0.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.0.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.0.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.0.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.0.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.0.ffn_norm.weight
F32
F32
[8192]
blk.0.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.1
blk.1.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.1.attn_norm.weight
F32
F32
[8192]
blk.1.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.1.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.1.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.1.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.1.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.1.ffn_norm.weight
F32
F32
[8192]
blk.1.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.2
blk.2.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.2.attn_norm.weight
F32
F32
[8192]
blk.2.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.2.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.2.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.2.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.2.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.2.ffn_norm.weight
F32
F32
[8192]
blk.2.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.3
blk.3.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.3.attn_norm.weight
F32
F32
[8192]
blk.3.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.3.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.3.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.3.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.3.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.3.ffn_norm.weight
F32
F32
[8192]
blk.3.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.4
blk.4.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.4.attn_norm.weight
F32
F32
[8192]
blk.4.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.4.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.4.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.4.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.4.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.4.ffn_norm.weight
F32
F32
[8192]
blk.4.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.5
blk.5.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.5.attn_norm.weight
F32
F32
[8192]
blk.5.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.5.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.5.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.5.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.5.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.5.ffn_norm.weight
F32
F32
[8192]
blk.5.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.6
blk.6.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.6.attn_norm.weight
F32
F32
[8192]
blk.6.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.6.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.6.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.6.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.6.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.6.ffn_norm.weight
F32
F32
[8192]
blk.6.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.7
blk.7.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.7.attn_norm.weight
F32
F32
[8192]
blk.7.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.7.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.7.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.7.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.7.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.7.ffn_norm.weight
F32
F32
[8192]
blk.7.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.8
blk.8.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.8.attn_norm.weight
F32
F32
[8192]
blk.8.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.8.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.8.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.8.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.8.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.8.ffn_norm.weight
F32
F32
[8192]
blk.8.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.9
blk.9.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.9.attn_norm.weight
F32
F32
[8192]
blk.9.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.9.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.9.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.9.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.9.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.9.ffn_norm.weight
F32
F32
[8192]
blk.9.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.10
blk.10.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.10.attn_norm.weight
F32
F32
[8192]
blk.10.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.10.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.10.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.10.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.10.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.10.ffn_norm.weight
F32
F32
[8192]
blk.10.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.11
blk.11.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.11.attn_norm.weight
F32
F32
[8192]
blk.11.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.11.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.11.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.11.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.11.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.11.ffn_norm.weight
F32
F32
[8192]
blk.11.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.12
blk.12.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.12.attn_norm.weight
F32
F32
[8192]
blk.12.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.12.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.12.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.12.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.12.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.12.ffn_norm.weight
F32
F32
[8192]
blk.12.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.13
blk.13.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.13.attn_norm.weight
F32
F32
[8192]
blk.13.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.13.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.13.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.13.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.13.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.13.ffn_norm.weight
F32
F32
[8192]
blk.13.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.14
blk.14.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.14.attn_norm.weight
F32
F32
[8192]
blk.14.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.14.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.14.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.14.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.14.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.14.ffn_norm.weight
F32
F32
[8192]
blk.14.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.15
blk.15.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.15.attn_norm.weight
F32
F32
[8192]
blk.15.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.15.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.15.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.15.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.15.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.15.ffn_norm.weight
F32
F32
[8192]
blk.15.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.16
blk.16.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.16.attn_norm.weight
F32
F32
[8192]
blk.16.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.16.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.16.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.16.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.16.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.16.ffn_norm.weight
F32
F32
[8192]
blk.16.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.17
blk.17.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.17.attn_norm.weight
F32
F32
[8192]
blk.17.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.17.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.17.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.17.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.17.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.17.ffn_norm.weight
F32
F32
[8192]
blk.17.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.18
blk.18.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.18.attn_norm.weight
F32
F32
[8192]
blk.18.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.18.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.18.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.18.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.18.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.18.ffn_norm.weight
F32
F32
[8192]
blk.18.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.19
blk.19.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.19.attn_norm.weight
F32
F32
[8192]
blk.19.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.19.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.19.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.19.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.19.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.19.ffn_norm.weight
F32
F32
[8192]
blk.19.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.20
blk.20.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.20.attn_norm.weight
F32
F32
[8192]
blk.20.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.20.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.20.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.20.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.20.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.20.ffn_norm.weight
F32
F32
[8192]
blk.20.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.21
blk.21.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.21.attn_norm.weight
F32
F32
[8192]
blk.21.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.21.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.21.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.21.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.21.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.21.ffn_norm.weight
F32
F32
[8192]
blk.21.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.22
blk.22.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.22.attn_norm.weight
F32
F32
[8192]
blk.22.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.22.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.22.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.22.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.22.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.22.ffn_norm.weight
F32
F32
[8192]
blk.22.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.23
blk.23.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.23.attn_norm.weight
F32
F32
[8192]
blk.23.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.23.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.23.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.23.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.23.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.23.ffn_norm.weight
F32
F32
[8192]
blk.23.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.24
blk.24.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.24.attn_norm.weight
F32
F32
[8192]
blk.24.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.24.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.24.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.24.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.24.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.24.ffn_norm.weight
F32
F32
[8192]
blk.24.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.25
blk.25.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.25.attn_norm.weight
F32
F32
[8192]
blk.25.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.25.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.25.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.25.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.25.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.25.ffn_norm.weight
F32
F32
[8192]
blk.25.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.26
blk.26.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.26.attn_norm.weight
F32
F32
[8192]
blk.26.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.26.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.26.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.26.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.26.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.26.ffn_norm.weight
F32
F32
[8192]
blk.26.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.27
blk.27.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.27.attn_norm.weight
F32
F32
[8192]
blk.27.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.27.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.27.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.27.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.27.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.27.ffn_norm.weight
F32
F32
[8192]
blk.27.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.28
blk.28.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.28.attn_norm.weight
F32
F32
[8192]
blk.28.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.28.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.28.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.28.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.28.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.28.ffn_norm.weight
F32
F32
[8192]
blk.28.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.29
blk.29.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.29.attn_norm.weight
F32
F32
[8192]
blk.29.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.29.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.29.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.29.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.29.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.29.ffn_norm.weight
F32
F32
[8192]
blk.29.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.30
blk.30.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.30.attn_norm.weight
F32
F32
[8192]
blk.30.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.30.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.30.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.30.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.30.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.30.ffn_norm.weight
F32
F32
[8192]
blk.30.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.31
blk.31.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.31.attn_norm.weight
F32
F32
[8192]
blk.31.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.31.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.31.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.31.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.31.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.31.ffn_norm.weight
F32
F32
[8192]
blk.31.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.32
blk.32.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.32.attn_norm.weight
F32
F32
[8192]
blk.32.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.32.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.32.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.32.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.32.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.32.ffn_norm.weight
F32
F32
[8192]
blk.32.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.33
blk.33.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.33.attn_norm.weight
F32
F32
[8192]
blk.33.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.33.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.33.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.33.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.33.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.33.ffn_norm.weight
F32
F32
[8192]
blk.33.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.34
blk.34.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.34.attn_norm.weight
F32
F32
[8192]
blk.34.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.34.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.34.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.34.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.34.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.34.ffn_norm.weight
F32
F32
[8192]
blk.34.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.35
blk.35.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.35.attn_norm.weight
F32
F32
[8192]
blk.35.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.35.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.35.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.35.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.35.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.35.ffn_norm.weight
F32
F32
[8192]
blk.35.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.36
blk.36.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.36.attn_norm.weight
F32
F32
[8192]
blk.36.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.36.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.36.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.36.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.36.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.36.ffn_norm.weight
F32
F32
[8192]
blk.36.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.37
blk.37.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.37.attn_norm.weight
F32
F32
[8192]
blk.37.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.37.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.37.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.37.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.37.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.37.ffn_norm.weight
F32
F32
[8192]
blk.37.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.38
blk.38.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.38.attn_norm.weight
F32
F32
[8192]
blk.38.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.38.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.38.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.38.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.38.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.38.ffn_norm.weight
F32
F32
[8192]
blk.38.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.39
blk.39.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.39.attn_norm.weight
F32
F32
[8192]
blk.39.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.39.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.39.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.39.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.39.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.39.ffn_norm.weight
F32
F32
[8192]
blk.39.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.40
blk.40.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.40.attn_norm.weight
F32
F32
[8192]
blk.40.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.40.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.40.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.40.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.40.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.40.ffn_norm.weight
F32
F32
[8192]
blk.40.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.41
blk.41.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.41.attn_norm.weight
F32
F32
[8192]
blk.41.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.41.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.41.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.41.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.41.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.41.ffn_norm.weight
F32
F32
[8192]
blk.41.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.42
blk.42.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.42.attn_norm.weight
F32
F32
[8192]
blk.42.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.42.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.42.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.42.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.42.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.42.ffn_norm.weight
F32
F32
[8192]
blk.42.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.43
blk.43.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.43.attn_norm.weight
F32
F32
[8192]
blk.43.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.43.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.43.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.43.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.43.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.43.ffn_norm.weight
F32
F32
[8192]
blk.43.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.44
blk.44.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.44.attn_norm.weight
F32
F32
[8192]
blk.44.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.44.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.44.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.44.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.44.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.44.ffn_norm.weight
F32
F32
[8192]
blk.44.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.45
blk.45.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.45.attn_norm.weight
F32
F32
[8192]
blk.45.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.45.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.45.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.45.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.45.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.45.ffn_norm.weight
F32
F32
[8192]
blk.45.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.46
blk.46.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.46.attn_norm.weight
F32
F32
[8192]
blk.46.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.46.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.46.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.46.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.46.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.46.ffn_norm.weight
F32
F32
[8192]
blk.46.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.47
blk.47.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.47.attn_norm.weight
F32
F32
[8192]
blk.47.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.47.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.47.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.47.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.47.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.47.ffn_norm.weight
F32
F32
[8192]
blk.47.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.48
blk.48.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.48.attn_norm.weight
F32
F32
[8192]
blk.48.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.48.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.48.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.48.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.48.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.48.ffn_norm.weight
F32
F32
[8192]
blk.48.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.49
blk.49.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.49.attn_norm.weight
F32
F32
[8192]
blk.49.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.49.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.49.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.49.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.49.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.49.ffn_norm.weight
F32
F32
[8192]
blk.49.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.50
blk.50.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.50.attn_norm.weight
F32
F32
[8192]
blk.50.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.50.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.50.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.50.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.50.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.50.ffn_norm.weight
F32
F32
[8192]
blk.50.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.51
blk.51.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.51.attn_norm.weight
F32
F32
[8192]
blk.51.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.51.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.51.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.51.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.51.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.51.ffn_norm.weight
F32
F32
[8192]
blk.51.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.52
blk.52.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.52.attn_norm.weight
F32
F32
[8192]
blk.52.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.52.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.52.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.52.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.52.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.52.ffn_norm.weight
F32
F32
[8192]
blk.52.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.53
blk.53.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.53.attn_norm.weight
F32
F32
[8192]
blk.53.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.53.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.53.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.53.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.53.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.53.ffn_norm.weight
F32
F32
[8192]
blk.53.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.54
blk.54.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.54.attn_norm.weight
F32
F32
[8192]
blk.54.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.54.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.54.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.54.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.54.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.54.ffn_norm.weight
F32
F32
[8192]
blk.54.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.55
blk.55.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.55.attn_norm.weight
F32
F32
[8192]
blk.55.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.55.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.55.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.55.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.55.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.55.ffn_norm.weight
F32
F32
[8192]
blk.55.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.56
blk.56.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.56.attn_norm.weight
F32
F32
[8192]
blk.56.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.56.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.56.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.56.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.56.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.56.ffn_norm.weight
F32
F32
[8192]
blk.56.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.57
blk.57.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.57.attn_norm.weight
F32
F32
[8192]
blk.57.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.57.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.57.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.57.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.57.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.57.ffn_norm.weight
F32
F32
[8192]
blk.57.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.58
blk.58.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.58.attn_norm.weight
F32
F32
[8192]
blk.58.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.58.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.58.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.58.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.58.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.58.ffn_norm.weight
F32
F32
[8192]
blk.58.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.59
blk.59.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.59.attn_norm.weight
F32
F32
[8192]
blk.59.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.59.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.59.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.59.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.59.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.59.ffn_norm.weight
F32
F32
[8192]
blk.59.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.60
blk.60.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.60.attn_norm.weight
F32
F32
[8192]
blk.60.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.60.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.60.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.60.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.60.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.60.ffn_norm.weight
F32
F32
[8192]
blk.60.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.61
blk.61.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.61.attn_norm.weight
F32
F32
[8192]
blk.61.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.61.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.61.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.61.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.61.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.61.ffn_norm.weight
F32
F32
[8192]
blk.61.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.62
blk.62.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.62.attn_norm.weight
F32
F32
[8192]
blk.62.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.62.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.62.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.62.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.62.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.62.ffn_norm.weight
F32
F32
[8192]
blk.62.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.63
blk.63.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.63.attn_norm.weight
F32
F32
[8192]
blk.63.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.63.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.63.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.63.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.63.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.63.ffn_norm.weight
F32
F32
[8192]
blk.63.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.64
blk.64.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.64.attn_norm.weight
F32
F32
[8192]
blk.64.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.64.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.64.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.64.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.64.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.64.ffn_norm.weight
F32
F32
[8192]
blk.64.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.65
blk.65.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.65.attn_norm.weight
F32
F32
[8192]
blk.65.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.65.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.65.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.65.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.65.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.65.ffn_norm.weight
F32
F32
[8192]
blk.65.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.66
blk.66.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.66.attn_norm.weight
F32
F32
[8192]
blk.66.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.66.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.66.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.66.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.66.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.66.ffn_norm.weight
F32
F32
[8192]
blk.66.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.67
blk.67.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.67.attn_norm.weight
F32
F32
[8192]
blk.67.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.67.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.67.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.67.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.67.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.67.ffn_norm.weight
F32
F32
[8192]
blk.67.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.68
blk.68.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.68.attn_norm.weight
F32
F32
[8192]
blk.68.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.68.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.68.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.68.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.68.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.68.ffn_norm.weight
F32
F32
[8192]
blk.68.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.69
blk.69.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.69.attn_norm.weight
F32
F32
[8192]
blk.69.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.69.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.69.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.69.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.69.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.69.ffn_norm.weight
F32
F32
[8192]
blk.69.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.70
blk.70.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.70.attn_norm.weight
F32
F32
[8192]
blk.70.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.70.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.70.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.70.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.70.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.70.ffn_norm.weight
F32
F32
[8192]
blk.70.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.71
blk.71.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.71.attn_norm.weight
F32
F32
[8192]
blk.71.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.71.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.71.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.71.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.71.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.71.ffn_norm.weight
F32
F32
[8192]
blk.71.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.72
blk.72.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.72.attn_norm.weight
F32
F32
[8192]
blk.72.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.72.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.72.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.72.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.72.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.72.ffn_norm.weight
F32
F32
[8192]
blk.72.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.73
blk.73.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.73.attn_norm.weight
F32
F32
[8192]
blk.73.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.73.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.73.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.73.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.73.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.73.ffn_norm.weight
F32
F32
[8192]
blk.73.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.74
blk.74.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.74.attn_norm.weight
F32
F32
[8192]
blk.74.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.74.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.74.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.74.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.74.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.74.ffn_norm.weight
F32
F32
[8192]
blk.74.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.75
blk.75.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.75.attn_norm.weight
F32
F32
[8192]
blk.75.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.75.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.75.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.75.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.75.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.75.ffn_norm.weight
F32
F32
[8192]
blk.75.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.76
blk.76.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.76.attn_norm.weight
F32
F32
[8192]
blk.76.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.76.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.76.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.76.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.76.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.76.ffn_norm.weight
F32
F32
[8192]
blk.76.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.77
blk.77.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.77.attn_norm.weight
F32
F32
[8192]
blk.77.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.77.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.77.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.77.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.77.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.77.ffn_norm.weight
F32
F32
[8192]
blk.77.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.78
blk.78.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.78.attn_norm.weight
F32
F32
[8192]
blk.78.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.78.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.78.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.78.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.78.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.78.ffn_norm.weight
F32
F32
[8192]
blk.78.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.79
blk.79.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.79.attn_norm.weight
F32
F32
[8192]
blk.79.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.79.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.79.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.79.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.79.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.79.ffn_norm.weight
F32
F32
[8192]
blk.79.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.80
blk.80.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.80.attn_norm.weight
F32
F32
[8192]
blk.80.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.80.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.80.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.80.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.80.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.80.ffn_norm.weight
F32
F32
[8192]
blk.80.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.81
blk.81.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.81.attn_norm.weight
F32
F32
[8192]
blk.81.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.81.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.81.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.81.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.81.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.81.ffn_norm.weight
F32
F32
[8192]
blk.81.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.82
blk.82.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.82.attn_norm.weight
F32
F32
[8192]
blk.82.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.82.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.82.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.82.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.82.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.82.ffn_norm.weight
F32
F32
[8192]
blk.82.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.83
blk.83.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.83.attn_norm.weight
F32
F32
[8192]
blk.83.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.83.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.83.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.83.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.83.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.83.ffn_norm.weight
F32
F32
[8192]
blk.83.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.84
blk.84.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.84.attn_norm.weight
F32
F32
[8192]
blk.84.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.84.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.84.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.84.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.84.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.84.ffn_norm.weight
F32
F32
[8192]
blk.84.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.85
blk.85.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.85.attn_norm.weight
F32
F32
[8192]
blk.85.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.85.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.85.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.85.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.85.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.85.ffn_norm.weight
F32
F32
[8192]
blk.85.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.86
blk.86.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.86.attn_norm.weight
F32
F32
[8192]
blk.86.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.86.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.86.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.86.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.86.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.86.ffn_norm.weight
F32
F32
[8192]
blk.86.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.87
blk.87.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.87.attn_norm.weight
F32
F32
[8192]
blk.87.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.87.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.87.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.87.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.87.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.87.ffn_norm.weight
F32
F32
[8192]
blk.87.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.88
blk.88.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.88.attn_norm.weight
F32
F32
[8192]
blk.88.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.88.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.88.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.88.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.88.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.88.ffn_norm.weight
F32
F32
[8192]
blk.88.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.89
blk.89.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.89.attn_norm.weight
F32
F32
[8192]
blk.89.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.89.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.89.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.89.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.89.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.89.ffn_norm.weight
F32
F32
[8192]
blk.89.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.90
blk.90.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.90.attn_norm.weight
F32
F32
[8192]
blk.90.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.90.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.90.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.90.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.90.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.90.ffn_norm.weight
F32
F32
[8192]
blk.90.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.91
blk.91.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.91.attn_norm.weight
F32
F32
[8192]
blk.91.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.91.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.91.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.91.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.91.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.91.ffn_norm.weight
F32
F32
[8192]
blk.91.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.92
blk.92.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.92.attn_norm.weight
F32
F32
[8192]
blk.92.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.92.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.92.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.92.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.92.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.92.ffn_norm.weight
F32
F32
[8192]
blk.92.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.93
blk.93.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.93.attn_norm.weight
F32
F32
[8192]
blk.93.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.93.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.93.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.93.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.93.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.93.ffn_norm.weight
F32
F32
[8192]
blk.93.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.94
blk.94.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.94.attn_norm.weight
F32
F32
[8192]
blk.94.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.94.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.94.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.94.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.94.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.94.ffn_norm.weight
F32
F32
[8192]
blk.94.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.95
blk.95.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.95.attn_norm.weight
F32
F32
[8192]
blk.95.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.95.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.95.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.95.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.95.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.95.ffn_norm.weight
F32
F32
[8192]
blk.95.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.96
blk.96.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.96.attn_norm.weight
F32
F32
[8192]
blk.96.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.96.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.96.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.96.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.96.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.96.ffn_norm.weight
F32
F32
[8192]
blk.96.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.97
blk.97.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.97.attn_norm.weight
F32
F32
[8192]
blk.97.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.97.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.97.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.97.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.97.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.97.ffn_norm.weight
F32
F32
[8192]
blk.97.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.98
blk.98.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.98.attn_norm.weight
F32
F32
[8192]
blk.98.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.98.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.98.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.98.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.98.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.98.ffn_norm.weight
F32
F32
[8192]
blk.98.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.99
blk.99.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.99.attn_norm.weight
F32
F32
[8192]
blk.99.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.99.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.99.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.99.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.99.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.99.ffn_norm.weight
F32
F32
[8192]
blk.99.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.100
blk.100.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.100.attn_norm.weight
F32
F32
[8192]
blk.100.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.100.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.100.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.100.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.100.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.100.ffn_norm.weight
F32
F32
[8192]
blk.100.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.101
blk.101.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.101.attn_norm.weight
F32
F32
[8192]
blk.101.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.101.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.101.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.101.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.101.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.101.ffn_norm.weight
F32
F32
[8192]
blk.101.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.102
blk.102.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.102.attn_norm.weight
F32
F32
[8192]
blk.102.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.102.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.102.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.102.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.102.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.102.ffn_norm.weight
F32
F32
[8192]
blk.102.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.103
blk.103.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.103.attn_norm.weight
F32
F32
[8192]
blk.103.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.103.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.103.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.103.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.103.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.103.ffn_norm.weight
F32
F32
[8192]
blk.103.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.104
blk.104.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.104.attn_norm.weight
F32
F32
[8192]
blk.104.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.104.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.104.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.104.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.104.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.104.ffn_norm.weight
F32
F32
[8192]
blk.104.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.105
blk.105.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.105.attn_norm.weight
F32
F32
[8192]
blk.105.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.105.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.105.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.105.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.105.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.105.ffn_norm.weight
F32
F32
[8192]
blk.105.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.106
blk.106.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.106.attn_norm.weight
F32
F32
[8192]
blk.106.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.106.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.106.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.106.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.106.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.106.ffn_norm.weight
F32
F32
[8192]
blk.106.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.107
blk.107.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.107.attn_norm.weight
F32
F32
[8192]
blk.107.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.107.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.107.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.107.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.107.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.107.ffn_norm.weight
F32
F32
[8192]
blk.107.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.108
blk.108.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.108.attn_norm.weight
F32
F32
[8192]
blk.108.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.108.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.108.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.108.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.108.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.108.ffn_norm.weight
F32
F32
[8192]
blk.108.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.109
blk.109.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.109.attn_norm.weight
F32
F32
[8192]
blk.109.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.109.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.109.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.109.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.109.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.109.ffn_norm.weight
F32
F32
[8192]
blk.109.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.110
blk.110.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.110.attn_norm.weight
F32
F32
[8192]
blk.110.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.110.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.110.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.110.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.110.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.110.ffn_norm.weight
F32
F32
[8192]
blk.110.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.111
blk.111.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.111.attn_norm.weight
F32
F32
[8192]
blk.111.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.111.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.111.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.111.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.111.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.111.ffn_norm.weight
F32
F32
[8192]
blk.111.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.112
blk.112.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.112.attn_norm.weight
F32
F32
[8192]
blk.112.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.112.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.112.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.112.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.112.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.112.ffn_norm.weight
F32
F32
[8192]
blk.112.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.113
blk.113.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.113.attn_norm.weight
F32
F32
[8192]
blk.113.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.113.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.113.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.113.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.113.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.113.ffn_norm.weight
F32
F32
[8192]
blk.113.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.114
blk.114.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.114.attn_norm.weight
F32
F32
[8192]
blk.114.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.114.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.114.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.114.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.114.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.114.ffn_norm.weight
F32
F32
[8192]
blk.114.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.115
blk.115.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.115.attn_norm.weight
F32
F32
[8192]
blk.115.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.115.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.115.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.115.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.115.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.115.ffn_norm.weight
F32
F32
[8192]
blk.115.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.116
blk.116.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.116.attn_norm.weight
F32
F32
[8192]
blk.116.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.116.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.116.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.116.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.116.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.116.ffn_norm.weight
F32
F32
[8192]
blk.116.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.117
blk.117.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.117.attn_norm.weight
F32
F32
[8192]
blk.117.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.117.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.117.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.117.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.117.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.117.ffn_norm.weight
F32
F32
[8192]
blk.117.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.118
blk.118.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.118.attn_norm.weight
F32
F32
[8192]
blk.118.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.118.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.118.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.118.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.118.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.118.ffn_norm.weight
F32
F32
[8192]
blk.118.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.119
blk.119.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.119.attn_norm.weight
F32
F32
[8192]
blk.119.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.119.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.119.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.119.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.119.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.119.ffn_norm.weight
F32
F32
[8192]
blk.119.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.120
blk.120.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.120.attn_norm.weight
F32
F32
[8192]
blk.120.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.120.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.120.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.120.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.120.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.120.ffn_norm.weight
F32
F32
[8192]
blk.120.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.121
blk.121.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.121.attn_norm.weight
F32
F32
[8192]
blk.121.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.121.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.121.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.121.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.121.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.121.ffn_norm.weight
F32
F32
[8192]
blk.121.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.122
blk.122.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.122.attn_norm.weight
F32
F32
[8192]
blk.122.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.122.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.122.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.122.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.122.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.122.ffn_norm.weight
F32
F32
[8192]
blk.122.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.123
blk.123.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.123.attn_norm.weight
F32
F32
[8192]
blk.123.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.123.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.123.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.123.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.123.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.123.ffn_norm.weight
F32
F32
[8192]
blk.123.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.124
blk.124.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.124.attn_norm.weight
F32
F32
[8192]
blk.124.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.124.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.124.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.124.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.124.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.124.ffn_norm.weight
F32
F32
[8192]
blk.124.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.125
blk.125.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.125.attn_norm.weight
F32
F32
[8192]
blk.125.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.125.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.125.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.125.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.125.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.125.ffn_norm.weight
F32
F32
[8192]
blk.125.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.126
blk.126.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.126.attn_norm.weight
F32
F32
[8192]
blk.126.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.126.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.126.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.126.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.126.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.126.ffn_norm.weight
F32
F32
[8192]
blk.126.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.127
blk.127.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.127.attn_norm.weight
F32
F32
[8192]
blk.127.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.127.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.127.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.127.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.127.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.127.ffn_norm.weight
F32
F32
[8192]
blk.127.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.128
blk.128.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.128.attn_norm.weight
F32
F32
[8192]
blk.128.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.128.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.128.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.128.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.128.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.128.ffn_norm.weight
F32
F32
[8192]
blk.128.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.129
blk.129.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.129.attn_norm.weight
F32
F32
[8192]
blk.129.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.129.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.129.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.129.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.129.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.129.ffn_norm.weight
F32
F32
[8192]
blk.129.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.130
blk.130.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.130.attn_norm.weight
F32
F32
[8192]
blk.130.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.130.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.130.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.130.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.130.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.130.ffn_norm.weight
F32
F32
[8192]
blk.130.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.131
blk.131.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.131.attn_norm.weight
F32
F32
[8192]
blk.131.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.131.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.131.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.131.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.131.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.131.ffn_norm.weight
F32
F32
[8192]
blk.131.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.132
blk.132.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.132.attn_norm.weight
F32
F32
[8192]
blk.132.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.132.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.132.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.132.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.132.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.132.ffn_norm.weight
F32
F32
[8192]
blk.132.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.133
blk.133.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.133.attn_norm.weight
F32
F32
[8192]
blk.133.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.133.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.133.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.133.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.133.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.133.ffn_norm.weight
F32
F32
[8192]
blk.133.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.134
blk.134.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.134.attn_norm.weight
F32
F32
[8192]
blk.134.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.134.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.134.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.134.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.134.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.134.ffn_norm.weight
F32
F32
[8192]
blk.134.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.135
blk.135.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.135.attn_norm.weight
F32
F32
[8192]
blk.135.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.135.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.135.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.135.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.135.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.135.ffn_norm.weight
F32
F32
[8192]
blk.135.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.136
blk.136.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.136.attn_norm.weight
F32
F32
[8192]
blk.136.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.136.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.136.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.136.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.136.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.136.ffn_norm.weight
F32
F32
[8192]
blk.136.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.137
blk.137.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.137.attn_norm.weight
F32
F32
[8192]
blk.137.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.137.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.137.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.137.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.137.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.137.ffn_norm.weight
F32
F32
[8192]
blk.137.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.138
blk.138.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.138.attn_norm.weight
F32
F32
[8192]
blk.138.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.138.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.138.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.138.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.138.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.138.ffn_norm.weight
F32
F32
[8192]
blk.138.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
blk.139
blk.139.attn_k.weight
Q4_0
Q4_0
[8192, 1024]
blk.139.attn_norm.weight
F32
F32
[8192]
blk.139.attn_output.weight
Q4_0
Q4_0
[8192, 8192]
blk.139.attn_q.weight
Q4_0
Q4_0
[8192, 8192]
blk.139.attn_v.weight
Q4_0
Q4_0
[8192, 1024]
blk.139.ffn_down.weight
Q4_0
Q4_0
[28672, 8192]
blk.139.ffn_gate.weight
Q4_0
Q4_0
[8192, 28672]
blk.139.ffn_norm.weight
F32
F32
[8192]
blk.139.ffn_up.weight
Q4_0
Q4_0
[8192, 28672]
output.weight
Q6_K
Q6_K
[8192, 32000]
output_norm.weight
F32
F32
[8192]