Models
GitHub
Discord
Docs
Cloud
Sign in
Download
Models
Download
GitHub
Discord
Docs
Cloud
Sign in
gaplo917
/
gemma2-tools
:27b
420
Downloads
Updated
11 months ago
gemma2 with tools support, modify the template from llama 3.2 to support tools
gemma2 with tools support, modify the template from llama 3.2 to support tools
Cancel
tools
2b
9b
27b
gemma2-tools:27b
...
/
model
d7e4b00a7d7a · 16GB
Metadata
general.architecture
gemma2
gemma2
general.file_type
Q4_0
Q4_0
gemma2.attention.head_count
32
32
gemma2.attention.head_count_kv
16
16
gemma2.attention.key_length
128
128
gemma2.attention.layer_norm_rms_epsilon
1e-06
1e-06
gemma2.attention.sliding_window
4096
4096
gemma2.attention.value_length
128
128
gemma2.attn_logit_softcapping
50
50
gemma2.block_count
46
46
gemma2.context_length
8192
8192
gemma2.embedding_length
4608
4608
gemma2.feed_forward_length
36864
36864
gemma2.final_logit_softcapping
30
30
tokenizer.ggml.add_bos_token
true
true
tokenizer.ggml.add_eos_token
false
false
tokenizer.ggml.add_space_prefix
false
false
tokenizer.ggml.bos_token_id
2
2
tokenizer.ggml.eos_token_id
1
1
tokenizer.ggml.model
llama
llama
tokenizer.ggml.padding_token_id
0
0
tokenizer.ggml.pre
default
default
tokenizer.ggml.scores
[0, 0, 0, 0, 0, ...]
[0, 0, 0, 0, 0, ...]
tokenizer.ggml.token_type
[3, 3, 3, 3, 3, ...]
[3, 3, 3, 3, 3, ...]
tokenizer.ggml.tokens
[<pad>, <eos>, <bos>, <unk>, <mask>, ...]
[<pad>, <eos>, <bos>, <unk>, <mask>, ...]
tokenizer.ggml.unknown_token_id
3
3
Tensor
Name
Type
Shape
token_embd.weight
Q6_K
Q6_K
[4608, 256000]
blk.0
blk.0.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.0.attn_norm.weight
F32
F32
[4608]
blk.0.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.0.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.0.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.0.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.0.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.0.ffn_norm.weight
F32
F32
[4608]
blk.0.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.0.post_attention_norm.weight
F32
F32
[4608]
blk.0.post_ffw_norm.weight
F32
F32
[4608]
blk.1
blk.1.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.1.attn_norm.weight
F32
F32
[4608]
blk.1.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.1.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.1.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.1.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.1.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.1.ffn_norm.weight
F32
F32
[4608]
blk.1.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.1.post_attention_norm.weight
F32
F32
[4608]
blk.1.post_ffw_norm.weight
F32
F32
[4608]
blk.2
blk.2.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.2.attn_norm.weight
F32
F32
[4608]
blk.2.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.2.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.2.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.2.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.2.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.2.ffn_norm.weight
F32
F32
[4608]
blk.2.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.2.post_attention_norm.weight
F32
F32
[4608]
blk.2.post_ffw_norm.weight
F32
F32
[4608]
blk.3
blk.3.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.3.attn_norm.weight
F32
F32
[4608]
blk.3.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.3.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.3.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.3.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.3.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.3.ffn_norm.weight
F32
F32
[4608]
blk.3.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.3.post_attention_norm.weight
F32
F32
[4608]
blk.3.post_ffw_norm.weight
F32
F32
[4608]
blk.4
blk.4.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.4.attn_norm.weight
F32
F32
[4608]
blk.4.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.4.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.4.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.4.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.4.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.4.ffn_norm.weight
F32
F32
[4608]
blk.4.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.4.post_attention_norm.weight
F32
F32
[4608]
blk.4.post_ffw_norm.weight
F32
F32
[4608]
blk.5
blk.5.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.5.attn_norm.weight
F32
F32
[4608]
blk.5.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.5.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.5.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.5.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.5.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.5.ffn_norm.weight
F32
F32
[4608]
blk.5.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.5.post_attention_norm.weight
F32
F32
[4608]
blk.5.post_ffw_norm.weight
F32
F32
[4608]
blk.6
blk.6.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.6.attn_norm.weight
F32
F32
[4608]
blk.6.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.6.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.6.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.6.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.6.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.6.ffn_norm.weight
F32
F32
[4608]
blk.6.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.6.post_attention_norm.weight
F32
F32
[4608]
blk.6.post_ffw_norm.weight
F32
F32
[4608]
blk.7
blk.7.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.7.attn_norm.weight
F32
F32
[4608]
blk.7.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.7.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.7.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.7.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.7.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.7.ffn_norm.weight
F32
F32
[4608]
blk.7.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.7.post_attention_norm.weight
F32
F32
[4608]
blk.7.post_ffw_norm.weight
F32
F32
[4608]
blk.8
blk.8.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.8.attn_norm.weight
F32
F32
[4608]
blk.8.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.8.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.8.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.8.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.8.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.8.ffn_norm.weight
F32
F32
[4608]
blk.8.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.8.post_attention_norm.weight
F32
F32
[4608]
blk.8.post_ffw_norm.weight
F32
F32
[4608]
blk.9
blk.9.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.9.attn_norm.weight
F32
F32
[4608]
blk.9.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.9.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.9.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.9.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.9.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.9.ffn_norm.weight
F32
F32
[4608]
blk.9.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.9.post_attention_norm.weight
F32
F32
[4608]
blk.9.post_ffw_norm.weight
F32
F32
[4608]
blk.10
blk.10.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.10.attn_norm.weight
F32
F32
[4608]
blk.10.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.10.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.10.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.10.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.10.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.10.ffn_norm.weight
F32
F32
[4608]
blk.10.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.10.post_attention_norm.weight
F32
F32
[4608]
blk.10.post_ffw_norm.weight
F32
F32
[4608]
blk.11
blk.11.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.11.attn_norm.weight
F32
F32
[4608]
blk.11.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.11.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.11.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.11.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.11.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.11.ffn_norm.weight
F32
F32
[4608]
blk.11.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.11.post_attention_norm.weight
F32
F32
[4608]
blk.11.post_ffw_norm.weight
F32
F32
[4608]
blk.12
blk.12.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.12.attn_norm.weight
F32
F32
[4608]
blk.12.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.12.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.12.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.12.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.12.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.12.ffn_norm.weight
F32
F32
[4608]
blk.12.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.12.post_attention_norm.weight
F32
F32
[4608]
blk.12.post_ffw_norm.weight
F32
F32
[4608]
blk.13
blk.13.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.13.attn_norm.weight
F32
F32
[4608]
blk.13.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.13.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.13.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.13.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.13.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.13.ffn_norm.weight
F32
F32
[4608]
blk.13.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.13.post_attention_norm.weight
F32
F32
[4608]
blk.13.post_ffw_norm.weight
F32
F32
[4608]
blk.14
blk.14.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.14.attn_norm.weight
F32
F32
[4608]
blk.14.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.14.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.14.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.14.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.14.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.14.ffn_norm.weight
F32
F32
[4608]
blk.14.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.14.post_attention_norm.weight
F32
F32
[4608]
blk.14.post_ffw_norm.weight
F32
F32
[4608]
blk.15
blk.15.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.15.attn_norm.weight
F32
F32
[4608]
blk.15.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.15.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.15.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.15.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.15.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.15.ffn_norm.weight
F32
F32
[4608]
blk.15.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.15.post_attention_norm.weight
F32
F32
[4608]
blk.15.post_ffw_norm.weight
F32
F32
[4608]
blk.16
blk.16.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.16.attn_norm.weight
F32
F32
[4608]
blk.16.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.16.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.16.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.16.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.16.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.16.ffn_norm.weight
F32
F32
[4608]
blk.16.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.16.post_attention_norm.weight
F32
F32
[4608]
blk.16.post_ffw_norm.weight
F32
F32
[4608]
blk.17
blk.17.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.17.attn_norm.weight
F32
F32
[4608]
blk.17.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.17.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.17.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.17.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.17.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.17.ffn_norm.weight
F32
F32
[4608]
blk.17.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.17.post_attention_norm.weight
F32
F32
[4608]
blk.17.post_ffw_norm.weight
F32
F32
[4608]
blk.18
blk.18.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.18.attn_norm.weight
F32
F32
[4608]
blk.18.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.18.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.18.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.18.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.18.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.18.ffn_norm.weight
F32
F32
[4608]
blk.18.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.18.post_attention_norm.weight
F32
F32
[4608]
blk.18.post_ffw_norm.weight
F32
F32
[4608]
blk.19
blk.19.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.19.attn_norm.weight
F32
F32
[4608]
blk.19.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.19.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.19.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.19.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.19.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.19.ffn_norm.weight
F32
F32
[4608]
blk.19.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.19.post_attention_norm.weight
F32
F32
[4608]
blk.19.post_ffw_norm.weight
F32
F32
[4608]
blk.20
blk.20.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.20.attn_norm.weight
F32
F32
[4608]
blk.20.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.20.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.20.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.20.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.20.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.20.ffn_norm.weight
F32
F32
[4608]
blk.20.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.20.post_attention_norm.weight
F32
F32
[4608]
blk.20.post_ffw_norm.weight
F32
F32
[4608]
blk.21
blk.21.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.21.attn_norm.weight
F32
F32
[4608]
blk.21.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.21.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.21.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.21.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.21.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.21.ffn_norm.weight
F32
F32
[4608]
blk.21.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.21.post_attention_norm.weight
F32
F32
[4608]
blk.21.post_ffw_norm.weight
F32
F32
[4608]
blk.22
blk.22.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.22.attn_norm.weight
F32
F32
[4608]
blk.22.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.22.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.22.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.22.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.22.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.22.ffn_norm.weight
F32
F32
[4608]
blk.22.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.22.post_attention_norm.weight
F32
F32
[4608]
blk.22.post_ffw_norm.weight
F32
F32
[4608]
blk.23
blk.23.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.23.attn_norm.weight
F32
F32
[4608]
blk.23.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.23.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.23.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.23.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.23.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.23.ffn_norm.weight
F32
F32
[4608]
blk.23.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.23.post_attention_norm.weight
F32
F32
[4608]
blk.23.post_ffw_norm.weight
F32
F32
[4608]
blk.24
blk.24.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.24.attn_norm.weight
F32
F32
[4608]
blk.24.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.24.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.24.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.24.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.24.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.24.ffn_norm.weight
F32
F32
[4608]
blk.24.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.24.post_attention_norm.weight
F32
F32
[4608]
blk.24.post_ffw_norm.weight
F32
F32
[4608]
blk.25
blk.25.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.25.attn_norm.weight
F32
F32
[4608]
blk.25.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.25.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.25.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.25.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.25.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.25.ffn_norm.weight
F32
F32
[4608]
blk.25.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.25.post_attention_norm.weight
F32
F32
[4608]
blk.25.post_ffw_norm.weight
F32
F32
[4608]
blk.26
blk.26.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.26.attn_norm.weight
F32
F32
[4608]
blk.26.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.26.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.26.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.26.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.26.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.26.ffn_norm.weight
F32
F32
[4608]
blk.26.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.26.post_attention_norm.weight
F32
F32
[4608]
blk.26.post_ffw_norm.weight
F32
F32
[4608]
blk.27
blk.27.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.27.attn_norm.weight
F32
F32
[4608]
blk.27.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.27.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.27.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.27.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.27.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.27.ffn_norm.weight
F32
F32
[4608]
blk.27.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.27.post_attention_norm.weight
F32
F32
[4608]
blk.27.post_ffw_norm.weight
F32
F32
[4608]
blk.28
blk.28.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.28.attn_norm.weight
F32
F32
[4608]
blk.28.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.28.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.28.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.28.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.28.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.28.ffn_norm.weight
F32
F32
[4608]
blk.28.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.28.post_attention_norm.weight
F32
F32
[4608]
blk.28.post_ffw_norm.weight
F32
F32
[4608]
blk.29
blk.29.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.29.attn_norm.weight
F32
F32
[4608]
blk.29.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.29.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.29.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.29.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.29.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.29.ffn_norm.weight
F32
F32
[4608]
blk.29.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.29.post_attention_norm.weight
F32
F32
[4608]
blk.29.post_ffw_norm.weight
F32
F32
[4608]
blk.30
blk.30.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.30.attn_norm.weight
F32
F32
[4608]
blk.30.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.30.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.30.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.30.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.30.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.30.ffn_norm.weight
F32
F32
[4608]
blk.30.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.30.post_attention_norm.weight
F32
F32
[4608]
blk.30.post_ffw_norm.weight
F32
F32
[4608]
blk.31
blk.31.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.31.attn_norm.weight
F32
F32
[4608]
blk.31.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.31.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.31.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.31.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.31.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.31.ffn_norm.weight
F32
F32
[4608]
blk.31.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.31.post_attention_norm.weight
F32
F32
[4608]
blk.31.post_ffw_norm.weight
F32
F32
[4608]
blk.32
blk.32.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.32.attn_norm.weight
F32
F32
[4608]
blk.32.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.32.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.32.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.32.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.32.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.32.ffn_norm.weight
F32
F32
[4608]
blk.32.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.32.post_attention_norm.weight
F32
F32
[4608]
blk.32.post_ffw_norm.weight
F32
F32
[4608]
blk.33
blk.33.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.33.attn_norm.weight
F32
F32
[4608]
blk.33.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.33.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.33.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.33.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.33.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.33.ffn_norm.weight
F32
F32
[4608]
blk.33.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.33.post_attention_norm.weight
F32
F32
[4608]
blk.33.post_ffw_norm.weight
F32
F32
[4608]
blk.34
blk.34.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.34.attn_norm.weight
F32
F32
[4608]
blk.34.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.34.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.34.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.34.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.34.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.34.ffn_norm.weight
F32
F32
[4608]
blk.34.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.34.post_attention_norm.weight
F32
F32
[4608]
blk.34.post_ffw_norm.weight
F32
F32
[4608]
blk.35
blk.35.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.35.attn_norm.weight
F32
F32
[4608]
blk.35.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.35.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.35.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.35.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.35.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.35.ffn_norm.weight
F32
F32
[4608]
blk.35.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.35.post_attention_norm.weight
F32
F32
[4608]
blk.35.post_ffw_norm.weight
F32
F32
[4608]
blk.36
blk.36.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.36.attn_norm.weight
F32
F32
[4608]
blk.36.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.36.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.36.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.36.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.36.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.36.ffn_norm.weight
F32
F32
[4608]
blk.36.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.36.post_attention_norm.weight
F32
F32
[4608]
blk.36.post_ffw_norm.weight
F32
F32
[4608]
blk.37
blk.37.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.37.attn_norm.weight
F32
F32
[4608]
blk.37.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.37.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.37.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.37.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.37.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.37.ffn_norm.weight
F32
F32
[4608]
blk.37.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.37.post_attention_norm.weight
F32
F32
[4608]
blk.37.post_ffw_norm.weight
F32
F32
[4608]
blk.38
blk.38.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.38.attn_norm.weight
F32
F32
[4608]
blk.38.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.38.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.38.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.38.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.38.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.38.ffn_norm.weight
F32
F32
[4608]
blk.38.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.38.post_attention_norm.weight
F32
F32
[4608]
blk.38.post_ffw_norm.weight
F32
F32
[4608]
blk.39
blk.39.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.39.attn_norm.weight
F32
F32
[4608]
blk.39.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.39.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.39.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.39.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.39.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.39.ffn_norm.weight
F32
F32
[4608]
blk.39.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.39.post_attention_norm.weight
F32
F32
[4608]
blk.39.post_ffw_norm.weight
F32
F32
[4608]
blk.40
blk.40.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.40.attn_norm.weight
F32
F32
[4608]
blk.40.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.40.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.40.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.40.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.40.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.40.ffn_norm.weight
F32
F32
[4608]
blk.40.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.40.post_attention_norm.weight
F32
F32
[4608]
blk.40.post_ffw_norm.weight
F32
F32
[4608]
blk.41
blk.41.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.41.attn_norm.weight
F32
F32
[4608]
blk.41.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.41.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.41.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.41.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.41.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.41.ffn_norm.weight
F32
F32
[4608]
blk.41.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.41.post_attention_norm.weight
F32
F32
[4608]
blk.41.post_ffw_norm.weight
F32
F32
[4608]
blk.42
blk.42.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.42.attn_norm.weight
F32
F32
[4608]
blk.42.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.42.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.42.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.42.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.42.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.42.ffn_norm.weight
F32
F32
[4608]
blk.42.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.42.post_attention_norm.weight
F32
F32
[4608]
blk.42.post_ffw_norm.weight
F32
F32
[4608]
blk.43
blk.43.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.43.attn_norm.weight
F32
F32
[4608]
blk.43.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.43.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.43.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.43.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.43.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.43.ffn_norm.weight
F32
F32
[4608]
blk.43.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.43.post_attention_norm.weight
F32
F32
[4608]
blk.43.post_ffw_norm.weight
F32
F32
[4608]
blk.44
blk.44.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.44.attn_norm.weight
F32
F32
[4608]
blk.44.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.44.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.44.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.44.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.44.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.44.ffn_norm.weight
F32
F32
[4608]
blk.44.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.44.post_attention_norm.weight
F32
F32
[4608]
blk.44.post_ffw_norm.weight
F32
F32
[4608]
blk.45
blk.45.attn_k.weight
Q4_0
Q4_0
[4608, 2048]
blk.45.attn_norm.weight
F32
F32
[4608]
blk.45.attn_output.weight
Q4_0
Q4_0
[4096, 4608]
blk.45.attn_q.weight
Q4_0
Q4_0
[4608, 4096]
blk.45.attn_v.weight
Q4_0
Q4_0
[4608, 2048]
blk.45.ffn_down.weight
Q4_0
Q4_0
[36864, 4608]
blk.45.ffn_gate.weight
Q4_0
Q4_0
[4608, 36864]
blk.45.ffn_norm.weight
F32
F32
[4608]
blk.45.ffn_up.weight
Q4_0
Q4_0
[4608, 36864]
blk.45.post_attention_norm.weight
F32
F32
[4608]
blk.45.post_ffw_norm.weight
F32
F32
[4608]
output_norm.weight
F32
F32
[4608]