Models
GitHub
Discord
Turbo
Sign in
Download
Models
Download
GitHub
Discord
Sign in
exaone-deep
:32b-q8_0
149.6K
Downloads
Updated
5 months ago
EXAONE Deep exhibits superior capabilities in various reasoning tasks including math and coding benchmarks, ranging from 2.4B to 32B parameters developed and released by LG AI Research.
EXAONE Deep exhibits superior capabilities in various reasoning tasks including math and coding benchmarks, ranging from 2.4B to 32B parameters developed and released by LG AI Research.
Cancel
2.4b
7.8b
32b
exaone-deep:32b-q8_0
...
/
model
e19c9bb175cc · 34GB
Metadata
general.architecture
exaone
exaone
general.file_type
Q8_0
Q8_0
exaone.attention.head_count
40
40
exaone.attention.head_count_kv
8
8
exaone.attention.layer_norm_rms_epsilon
1e-05
1e-05
exaone.block_count
64
64
exaone.context_length
32768
32768
exaone.embedding_length
5120
5120
exaone.feed_forward_length
27392
27392
exaone.rope.dimension_count
128
128
exaone.rope.freq_base
1e+06
1e+06
tokenizer.ggml.bos_token_id
1
1
tokenizer.ggml.eos_token_id
361
361
tokenizer.ggml.merges
[t h, Ġ a, Ġ í, i n, Ġ th, ...]
[t h, Ġ a, Ġ í, i n, Ġ th, ...]
tokenizer.ggml.model
gpt2
gpt2
tokenizer.ggml.padding_token_id
0
0
tokenizer.ggml.pre
exaone
exaone
tokenizer.ggml.token_type
[3, 3, 3, 3, 4, ...]
[3, 3, 3, 3, 4, ...]
tokenizer.ggml.tokens
[[PAD], [BOS], [EOS], [UNK], , ...]
[[PAD], [BOS], [EOS], [UNK], , ...]
tokenizer.ggml.unknown_token_id
3
3
Tensor
Name
Type
Shape
token_embd.weight
Q8_0
Q8_0
[5120, 102400]
blk.0
blk.0.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.0.attn_norm.weight
F32
F32
[5120]
blk.0.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.0.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.0.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.0.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.0.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.0.ffn_norm.weight
F32
F32
[5120]
blk.0.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.1
blk.1.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.1.attn_norm.weight
F32
F32
[5120]
blk.1.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.1.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.1.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.1.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.1.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.1.ffn_norm.weight
F32
F32
[5120]
blk.1.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.2
blk.2.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.2.attn_norm.weight
F32
F32
[5120]
blk.2.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.2.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.2.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.2.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.2.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.2.ffn_norm.weight
F32
F32
[5120]
blk.2.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.3
blk.3.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.3.attn_norm.weight
F32
F32
[5120]
blk.3.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.3.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.3.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.3.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.3.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.3.ffn_norm.weight
F32
F32
[5120]
blk.3.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.4
blk.4.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.4.attn_norm.weight
F32
F32
[5120]
blk.4.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.4.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.4.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.4.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.4.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.4.ffn_norm.weight
F32
F32
[5120]
blk.4.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.5
blk.5.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.5.attn_norm.weight
F32
F32
[5120]
blk.5.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.5.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.5.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.5.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.5.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.5.ffn_norm.weight
F32
F32
[5120]
blk.5.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.6
blk.6.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.6.attn_norm.weight
F32
F32
[5120]
blk.6.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.6.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.6.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.6.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.6.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.6.ffn_norm.weight
F32
F32
[5120]
blk.6.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.7
blk.7.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.7.attn_norm.weight
F32
F32
[5120]
blk.7.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.7.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.7.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.7.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.7.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.7.ffn_norm.weight
F32
F32
[5120]
blk.7.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.8
blk.8.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.8.attn_norm.weight
F32
F32
[5120]
blk.8.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.8.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.8.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.8.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.8.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.8.ffn_norm.weight
F32
F32
[5120]
blk.8.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.9
blk.9.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.9.attn_norm.weight
F32
F32
[5120]
blk.9.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.9.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.9.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.9.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.9.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.9.ffn_norm.weight
F32
F32
[5120]
blk.9.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.10
blk.10.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.10.attn_norm.weight
F32
F32
[5120]
blk.10.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.10.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.10.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.10.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.10.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.10.ffn_norm.weight
F32
F32
[5120]
blk.10.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.11
blk.11.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.11.attn_norm.weight
F32
F32
[5120]
blk.11.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.11.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.11.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.11.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.11.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.11.ffn_norm.weight
F32
F32
[5120]
blk.11.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.12
blk.12.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.12.attn_norm.weight
F32
F32
[5120]
blk.12.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.12.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.12.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.12.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.12.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.12.ffn_norm.weight
F32
F32
[5120]
blk.12.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.13
blk.13.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.13.attn_norm.weight
F32
F32
[5120]
blk.13.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.13.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.13.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.13.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.13.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.13.ffn_norm.weight
F32
F32
[5120]
blk.13.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.14
blk.14.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.14.attn_norm.weight
F32
F32
[5120]
blk.14.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.14.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.14.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.14.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.14.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.14.ffn_norm.weight
F32
F32
[5120]
blk.14.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.15
blk.15.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.15.attn_norm.weight
F32
F32
[5120]
blk.15.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.15.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.15.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.15.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.15.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.15.ffn_norm.weight
F32
F32
[5120]
blk.15.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.16
blk.16.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.16.attn_norm.weight
F32
F32
[5120]
blk.16.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.16.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.16.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.16.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.16.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.16.ffn_norm.weight
F32
F32
[5120]
blk.16.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.17
blk.17.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.17.attn_norm.weight
F32
F32
[5120]
blk.17.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.17.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.17.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.17.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.17.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.17.ffn_norm.weight
F32
F32
[5120]
blk.17.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.18
blk.18.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.18.attn_norm.weight
F32
F32
[5120]
blk.18.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.18.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.18.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.18.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.18.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.18.ffn_norm.weight
F32
F32
[5120]
blk.18.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.19
blk.19.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.19.attn_norm.weight
F32
F32
[5120]
blk.19.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.19.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.19.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.19.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.19.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.19.ffn_norm.weight
F32
F32
[5120]
blk.19.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.20
blk.20.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.20.attn_norm.weight
F32
F32
[5120]
blk.20.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.20.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.20.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.20.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.20.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.20.ffn_norm.weight
F32
F32
[5120]
blk.20.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.21
blk.21.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.21.attn_norm.weight
F32
F32
[5120]
blk.21.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.21.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.21.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.21.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.21.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.21.ffn_norm.weight
F32
F32
[5120]
blk.21.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.22
blk.22.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.22.attn_norm.weight
F32
F32
[5120]
blk.22.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.22.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.22.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.22.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.22.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.22.ffn_norm.weight
F32
F32
[5120]
blk.22.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.23
blk.23.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.23.attn_norm.weight
F32
F32
[5120]
blk.23.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.23.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.23.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.23.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.23.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.23.ffn_norm.weight
F32
F32
[5120]
blk.23.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.24
blk.24.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.24.attn_norm.weight
F32
F32
[5120]
blk.24.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.24.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.24.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.24.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.24.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.24.ffn_norm.weight
F32
F32
[5120]
blk.24.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.25
blk.25.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.25.attn_norm.weight
F32
F32
[5120]
blk.25.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.25.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.25.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.25.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.25.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.25.ffn_norm.weight
F32
F32
[5120]
blk.25.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.26
blk.26.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.26.attn_norm.weight
F32
F32
[5120]
blk.26.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.26.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.26.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.26.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.26.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.26.ffn_norm.weight
F32
F32
[5120]
blk.26.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.27
blk.27.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.27.attn_norm.weight
F32
F32
[5120]
blk.27.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.27.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.27.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.27.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.27.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.27.ffn_norm.weight
F32
F32
[5120]
blk.27.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.28
blk.28.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.28.attn_norm.weight
F32
F32
[5120]
blk.28.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.28.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.28.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.28.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.28.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.28.ffn_norm.weight
F32
F32
[5120]
blk.28.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.29
blk.29.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.29.attn_norm.weight
F32
F32
[5120]
blk.29.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.29.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.29.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.29.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.29.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.29.ffn_norm.weight
F32
F32
[5120]
blk.29.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.30
blk.30.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.30.attn_norm.weight
F32
F32
[5120]
blk.30.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.30.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.30.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.30.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.30.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.30.ffn_norm.weight
F32
F32
[5120]
blk.30.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.31
blk.31.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.31.attn_norm.weight
F32
F32
[5120]
blk.31.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.31.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.31.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.31.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.31.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.31.ffn_norm.weight
F32
F32
[5120]
blk.31.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.32
blk.32.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.32.attn_norm.weight
F32
F32
[5120]
blk.32.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.32.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.32.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.32.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.32.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.32.ffn_norm.weight
F32
F32
[5120]
blk.32.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.33
blk.33.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.33.attn_norm.weight
F32
F32
[5120]
blk.33.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.33.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.33.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.33.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.33.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.33.ffn_norm.weight
F32
F32
[5120]
blk.33.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.34
blk.34.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.34.attn_norm.weight
F32
F32
[5120]
blk.34.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.34.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.34.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.34.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.34.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.34.ffn_norm.weight
F32
F32
[5120]
blk.34.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.35
blk.35.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.35.attn_norm.weight
F32
F32
[5120]
blk.35.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.35.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.35.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.35.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.35.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.35.ffn_norm.weight
F32
F32
[5120]
blk.35.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.36
blk.36.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.36.attn_norm.weight
F32
F32
[5120]
blk.36.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.36.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.36.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.36.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.36.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.36.ffn_norm.weight
F32
F32
[5120]
blk.36.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.37
blk.37.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.37.attn_norm.weight
F32
F32
[5120]
blk.37.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.37.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.37.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.37.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.37.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.37.ffn_norm.weight
F32
F32
[5120]
blk.37.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.38
blk.38.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.38.attn_norm.weight
F32
F32
[5120]
blk.38.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.38.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.38.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.38.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.38.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.38.ffn_norm.weight
F32
F32
[5120]
blk.38.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.39
blk.39.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.39.attn_norm.weight
F32
F32
[5120]
blk.39.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.39.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.39.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.39.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.39.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.39.ffn_norm.weight
F32
F32
[5120]
blk.39.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.40
blk.40.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.40.attn_norm.weight
F32
F32
[5120]
blk.40.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.40.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.40.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.40.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.40.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.40.ffn_norm.weight
F32
F32
[5120]
blk.40.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.41
blk.41.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.41.attn_norm.weight
F32
F32
[5120]
blk.41.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.41.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.41.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.41.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.41.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.41.ffn_norm.weight
F32
F32
[5120]
blk.41.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.42
blk.42.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.42.attn_norm.weight
F32
F32
[5120]
blk.42.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.42.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.42.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.42.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.42.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.42.ffn_norm.weight
F32
F32
[5120]
blk.42.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.43
blk.43.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.43.attn_norm.weight
F32
F32
[5120]
blk.43.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.43.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.43.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.43.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.43.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.43.ffn_norm.weight
F32
F32
[5120]
blk.43.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.44
blk.44.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.44.attn_norm.weight
F32
F32
[5120]
blk.44.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.44.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.44.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.44.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.44.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.44.ffn_norm.weight
F32
F32
[5120]
blk.44.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.45
blk.45.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.45.attn_norm.weight
F32
F32
[5120]
blk.45.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.45.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.45.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.45.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.45.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.45.ffn_norm.weight
F32
F32
[5120]
blk.45.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.46
blk.46.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.46.attn_norm.weight
F32
F32
[5120]
blk.46.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.46.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.46.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.46.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.46.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.46.ffn_norm.weight
F32
F32
[5120]
blk.46.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.47
blk.47.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.47.attn_norm.weight
F32
F32
[5120]
blk.47.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.47.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.47.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.47.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.47.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.47.ffn_norm.weight
F32
F32
[5120]
blk.47.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.48
blk.48.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.48.attn_norm.weight
F32
F32
[5120]
blk.48.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.48.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.48.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.48.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.48.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.48.ffn_norm.weight
F32
F32
[5120]
blk.48.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.49
blk.49.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.49.attn_norm.weight
F32
F32
[5120]
blk.49.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.49.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.49.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.49.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.49.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.49.ffn_norm.weight
F32
F32
[5120]
blk.49.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.50
blk.50.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.50.attn_norm.weight
F32
F32
[5120]
blk.50.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.50.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.50.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.50.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.50.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.50.ffn_norm.weight
F32
F32
[5120]
blk.50.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.51
blk.51.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.51.attn_norm.weight
F32
F32
[5120]
blk.51.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.51.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.51.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.51.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.51.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.51.ffn_norm.weight
F32
F32
[5120]
blk.51.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.52
blk.52.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.52.attn_norm.weight
F32
F32
[5120]
blk.52.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.52.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.52.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.52.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.52.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.52.ffn_norm.weight
F32
F32
[5120]
blk.52.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.53
blk.53.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.53.attn_norm.weight
F32
F32
[5120]
blk.53.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.53.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.53.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.53.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.53.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.53.ffn_norm.weight
F32
F32
[5120]
blk.53.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.54
blk.54.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.54.attn_norm.weight
F32
F32
[5120]
blk.54.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.54.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.54.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.54.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.54.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.54.ffn_norm.weight
F32
F32
[5120]
blk.54.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.55
blk.55.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.55.attn_norm.weight
F32
F32
[5120]
blk.55.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.55.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.55.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.55.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.55.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.55.ffn_norm.weight
F32
F32
[5120]
blk.55.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.56
blk.56.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.56.attn_norm.weight
F32
F32
[5120]
blk.56.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.56.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.56.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.56.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.56.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.56.ffn_norm.weight
F32
F32
[5120]
blk.56.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.57
blk.57.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.57.attn_norm.weight
F32
F32
[5120]
blk.57.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.57.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.57.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.57.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.57.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.57.ffn_norm.weight
F32
F32
[5120]
blk.57.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.58
blk.58.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.58.attn_norm.weight
F32
F32
[5120]
blk.58.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.58.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.58.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.58.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.58.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.58.ffn_norm.weight
F32
F32
[5120]
blk.58.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.59
blk.59.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.59.attn_norm.weight
F32
F32
[5120]
blk.59.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.59.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.59.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.59.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.59.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.59.ffn_norm.weight
F32
F32
[5120]
blk.59.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.60
blk.60.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.60.attn_norm.weight
F32
F32
[5120]
blk.60.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.60.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.60.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.60.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.60.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.60.ffn_norm.weight
F32
F32
[5120]
blk.60.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.61
blk.61.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.61.attn_norm.weight
F32
F32
[5120]
blk.61.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.61.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.61.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.61.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.61.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.61.ffn_norm.weight
F32
F32
[5120]
blk.61.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.62
blk.62.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.62.attn_norm.weight
F32
F32
[5120]
blk.62.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.62.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.62.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.62.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.62.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.62.ffn_norm.weight
F32
F32
[5120]
blk.62.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
blk.63
blk.63.attn_k.weight
Q8_0
Q8_0
[5120, 1024]
blk.63.attn_norm.weight
F32
F32
[5120]
blk.63.attn_output.weight
Q8_0
Q8_0
[5120, 5120]
blk.63.attn_q.weight
Q8_0
Q8_0
[5120, 5120]
blk.63.attn_v.weight
Q8_0
Q8_0
[5120, 1024]
blk.63.ffn_down.weight
Q8_0
Q8_0
[27392, 5120]
blk.63.ffn_gate.weight
Q8_0
Q8_0
[5120, 27392]
blk.63.ffn_norm.weight
F32
F32
[5120]
blk.63.ffn_up.weight
Q8_0
Q8_0
[5120, 27392]
output.weight
Q8_0
Q8_0
[5120, 102400]
rope_freqs.weight
F32
F32
[64]
output_norm.weight
F32
F32
[5120]