latest
1.8GB
raspberry-3B by arcee-ai; GGUF file from QuantFactory/raspberry-3B-GGUF on Hugging Face. (This model has some weird problems; please don't use it in production.)
3B
5 Pulls Updated 5 days ago
61e76e8436ad · 1.8GB
-
general.architectureqwen2
-
general.file_typeQ4_0
-
qwen2.attention.head_count16
-
qwen2.attention.head_count_kv2
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count36
-
qwen2.context_length32768
-
qwen2.embedding_length2048
-
qwen2.feed_forward_length11008
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id151644
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ6_K[2048 151936]
-
blk.0.attn_norm.weightF32[2048]
-
blk.0.ffn_down.weightQ4_0[11008 2048]
-
blk.0.ffn_gate.weightQ4_0[2048 11008]
-
blk.0.ffn_up.weightQ4_0[2048 11008]
-
blk.0.ffn_norm.weightF32[2048]
-
blk.0.attn_k.biasF32[256]
-
blk.0.attn_k.weightQ4_0[2048 256]
-
blk.0.attn_output.weightQ4_0[2048 2048]
-
blk.0.attn_q.biasF32[2048]
-
blk.0.attn_q.weightQ4_0[2048 2048]
-
blk.0.attn_v.biasF32[256]
-
blk.0.attn_v.weightQ4_0[2048 256]
-
blk.1.attn_norm.weightF32[2048]
-
blk.1.ffn_down.weightQ4_0[11008 2048]
-
blk.1.ffn_gate.weightQ4_0[2048 11008]
-
blk.1.ffn_up.weightQ4_0[2048 11008]
-
blk.1.ffn_norm.weightF32[2048]
-
blk.1.attn_k.biasF32[256]
-
blk.1.attn_k.weightQ4_0[2048 256]
-
blk.1.attn_output.weightQ4_0[2048 2048]
-
blk.1.attn_q.biasF32[2048]
-
blk.1.attn_q.weightQ4_0[2048 2048]
-
blk.1.attn_v.biasF32[256]
-
blk.1.attn_v.weightQ4_0[2048 256]
-
blk.2.attn_norm.weightF32[2048]
-
blk.2.ffn_down.weightQ4_0[11008 2048]
-
blk.2.ffn_gate.weightQ4_0[2048 11008]
-
blk.2.ffn_up.weightQ4_0[2048 11008]
-
blk.2.ffn_norm.weightF32[2048]
-
blk.2.attn_k.biasF32[256]
-
blk.2.attn_k.weightQ4_0[2048 256]
-
blk.2.attn_output.weightQ4_0[2048 2048]
-
blk.2.attn_q.biasF32[2048]
-
blk.2.attn_q.weightQ4_0[2048 2048]
-
blk.2.attn_v.biasF32[256]
-
blk.2.attn_v.weightQ4_0[2048 256]
-
blk.3.attn_norm.weightF32[2048]
-
blk.3.ffn_down.weightQ4_0[11008 2048]
-
blk.3.ffn_gate.weightQ4_0[2048 11008]
-
blk.3.ffn_up.weightQ4_0[2048 11008]
-
blk.3.ffn_norm.weightF32[2048]
-
blk.3.attn_k.biasF32[256]
-
blk.3.attn_k.weightQ4_0[2048 256]
-
blk.3.attn_output.weightQ4_0[2048 2048]
-
blk.3.attn_q.biasF32[2048]
-
blk.3.attn_q.weightQ4_0[2048 2048]
-
blk.3.attn_v.biasF32[256]
-
blk.3.attn_v.weightQ4_0[2048 256]
-
blk.4.attn_norm.weightF32[2048]
-
blk.4.ffn_down.weightQ4_0[11008 2048]
-
blk.4.ffn_gate.weightQ4_0[2048 11008]
-
blk.4.ffn_up.weightQ4_0[2048 11008]
-
blk.4.ffn_norm.weightF32[2048]
-
blk.4.attn_k.biasF32[256]
-
blk.4.attn_k.weightQ4_0[2048 256]
-
blk.4.attn_output.weightQ4_0[2048 2048]
-
blk.4.attn_q.biasF32[2048]
-
blk.4.attn_q.weightQ4_0[2048 2048]
-
blk.4.attn_v.biasF32[256]
-
blk.4.attn_v.weightQ4_0[2048 256]
-
blk.5.attn_norm.weightF32[2048]
-
blk.5.ffn_down.weightQ4_0[11008 2048]
-
blk.5.ffn_gate.weightQ4_0[2048 11008]
-
blk.5.ffn_up.weightQ4_0[2048 11008]
-
blk.5.ffn_norm.weightF32[2048]
-
blk.5.attn_k.biasF32[256]
-
blk.5.attn_k.weightQ4_0[2048 256]
-
blk.5.attn_output.weightQ4_0[2048 2048]
-
blk.5.attn_q.biasF32[2048]
-
blk.5.attn_q.weightQ4_0[2048 2048]
-
blk.5.attn_v.biasF32[256]
-
blk.5.attn_v.weightQ4_0[2048 256]
-
blk.6.attn_norm.weightF32[2048]
-
blk.6.ffn_down.weightQ4_0[11008 2048]
-
blk.6.ffn_gate.weightQ4_0[2048 11008]
-
blk.6.ffn_up.weightQ4_0[2048 11008]
-
blk.6.ffn_norm.weightF32[2048]
-
blk.6.attn_k.biasF32[256]
-
blk.6.attn_k.weightQ4_0[2048 256]
-
blk.6.attn_output.weightQ4_0[2048 2048]
-
blk.6.attn_q.biasF32[2048]
-
blk.6.attn_q.weightQ4_0[2048 2048]
-
blk.6.attn_v.biasF32[256]
-
blk.6.attn_v.weightQ4_0[2048 256]
-
blk.7.attn_norm.weightF32[2048]
-
blk.7.ffn_down.weightQ4_0[11008 2048]
-
blk.7.ffn_gate.weightQ4_0[2048 11008]
-
blk.7.ffn_up.weightQ4_0[2048 11008]
-
blk.7.ffn_norm.weightF32[2048]
-
blk.7.attn_k.biasF32[256]
-
blk.7.attn_k.weightQ4_0[2048 256]
-
blk.7.attn_output.weightQ4_0[2048 2048]
-
blk.7.attn_q.biasF32[2048]
-
blk.7.attn_q.weightQ4_0[2048 2048]
-
blk.7.attn_v.biasF32[256]
-
blk.7.attn_v.weightQ4_0[2048 256]
-
blk.8.attn_norm.weightF32[2048]
-
blk.8.ffn_down.weightQ4_0[11008 2048]
-
blk.8.ffn_gate.weightQ4_0[2048 11008]
-
blk.8.ffn_up.weightQ4_0[2048 11008]
-
blk.8.ffn_norm.weightF32[2048]
-
blk.8.attn_k.biasF32[256]
-
blk.8.attn_k.weightQ4_0[2048 256]
-
blk.8.attn_output.weightQ4_0[2048 2048]
-
blk.8.attn_q.biasF32[2048]
-
blk.8.attn_q.weightQ4_0[2048 2048]
-
blk.8.attn_v.biasF32[256]
-
blk.8.attn_v.weightQ4_0[2048 256]
-
blk.9.attn_norm.weightF32[2048]
-
blk.9.ffn_down.weightQ4_0[11008 2048]
-
blk.9.ffn_gate.weightQ4_0[2048 11008]
-
blk.9.ffn_up.weightQ4_0[2048 11008]
-
blk.9.ffn_norm.weightF32[2048]
-
blk.9.attn_k.biasF32[256]
-
blk.9.attn_k.weightQ4_0[2048 256]
-
blk.9.attn_output.weightQ4_0[2048 2048]
-
blk.9.attn_q.biasF32[2048]
-
blk.9.attn_q.weightQ4_0[2048 2048]
-
blk.9.attn_v.biasF32[256]
-
blk.9.attn_v.weightQ4_0[2048 256]
-
blk.10.attn_norm.weightF32[2048]
-
blk.10.ffn_down.weightQ4_0[11008 2048]
-
blk.10.ffn_gate.weightQ4_0[2048 11008]
-
blk.10.ffn_up.weightQ4_0[2048 11008]
-
blk.10.ffn_norm.weightF32[2048]
-
blk.10.attn_k.biasF32[256]
-
blk.10.attn_k.weightQ4_0[2048 256]
-
blk.10.attn_output.weightQ4_0[2048 2048]
-
blk.10.attn_q.biasF32[2048]
-
blk.10.attn_q.weightQ4_0[2048 2048]
-
blk.10.attn_v.biasF32[256]
-
blk.10.attn_v.weightQ4_0[2048 256]
-
blk.11.attn_norm.weightF32[2048]
-
blk.11.ffn_down.weightQ4_0[11008 2048]
-
blk.11.ffn_gate.weightQ4_0[2048 11008]
-
blk.11.ffn_up.weightQ4_0[2048 11008]
-
blk.11.ffn_norm.weightF32[2048]
-
blk.11.attn_k.biasF32[256]
-
blk.11.attn_k.weightQ4_0[2048 256]
-
blk.11.attn_output.weightQ4_0[2048 2048]
-
blk.11.attn_q.biasF32[2048]
-
blk.11.attn_q.weightQ4_0[2048 2048]
-
blk.11.attn_v.biasF32[256]
-
blk.11.attn_v.weightQ4_0[2048 256]
-
blk.12.attn_norm.weightF32[2048]
-
blk.12.ffn_down.weightQ4_0[11008 2048]
-
blk.12.ffn_gate.weightQ4_0[2048 11008]
-
blk.12.ffn_up.weightQ4_0[2048 11008]
-
blk.12.ffn_norm.weightF32[2048]
-
blk.12.attn_k.biasF32[256]
-
blk.12.attn_k.weightQ4_0[2048 256]
-
blk.12.attn_output.weightQ4_0[2048 2048]
-
blk.12.attn_q.biasF32[2048]
-
blk.12.attn_q.weightQ4_0[2048 2048]
-
blk.12.attn_v.biasF32[256]
-
blk.12.attn_v.weightQ4_0[2048 256]
-
blk.13.attn_norm.weightF32[2048]
-
blk.13.ffn_down.weightQ4_0[11008 2048]
-
blk.13.ffn_gate.weightQ4_0[2048 11008]
-
blk.13.ffn_up.weightQ4_0[2048 11008]
-
blk.13.ffn_norm.weightF32[2048]
-
blk.13.attn_k.biasF32[256]
-
blk.13.attn_k.weightQ4_0[2048 256]
-
blk.13.attn_output.weightQ4_0[2048 2048]
-
blk.13.attn_q.biasF32[2048]
-
blk.13.attn_q.weightQ4_0[2048 2048]
-
blk.13.attn_v.biasF32[256]
-
blk.13.attn_v.weightQ4_0[2048 256]
-
blk.14.attn_norm.weightF32[2048]
-
blk.14.ffn_down.weightQ4_0[11008 2048]
-
blk.14.ffn_gate.weightQ4_0[2048 11008]
-
blk.14.ffn_up.weightQ4_0[2048 11008]
-
blk.14.ffn_norm.weightF32[2048]
-
blk.14.attn_k.biasF32[256]
-
blk.14.attn_k.weightQ4_0[2048 256]
-
blk.14.attn_output.weightQ4_0[2048 2048]
-
blk.14.attn_q.biasF32[2048]
-
blk.14.attn_q.weightQ4_0[2048 2048]
-
blk.14.attn_v.biasF32[256]
-
blk.14.attn_v.weightQ4_0[2048 256]
-
blk.15.attn_norm.weightF32[2048]
-
blk.15.ffn_down.weightQ4_0[11008 2048]
-
blk.15.ffn_gate.weightQ4_0[2048 11008]
-
blk.15.ffn_up.weightQ4_0[2048 11008]
-
blk.15.ffn_norm.weightF32[2048]
-
blk.15.attn_k.biasF32[256]
-
blk.15.attn_k.weightQ4_0[2048 256]
-
blk.15.attn_output.weightQ4_0[2048 2048]
-
blk.15.attn_q.biasF32[2048]
-
blk.15.attn_q.weightQ4_0[2048 2048]
-
blk.15.attn_v.biasF32[256]
-
blk.15.attn_v.weightQ4_0[2048 256]
-
blk.16.attn_norm.weightF32[2048]
-
blk.16.ffn_down.weightQ4_0[11008 2048]
-
blk.16.ffn_gate.weightQ4_0[2048 11008]
-
blk.16.ffn_up.weightQ4_0[2048 11008]
-
blk.16.ffn_norm.weightF32[2048]
-
blk.16.attn_k.biasF32[256]
-
blk.16.attn_k.weightQ4_0[2048 256]
-
blk.16.attn_output.weightQ4_0[2048 2048]
-
blk.16.attn_q.biasF32[2048]
-
blk.16.attn_q.weightQ4_0[2048 2048]
-
blk.16.attn_v.biasF32[256]
-
blk.16.attn_v.weightQ4_0[2048 256]
-
blk.17.attn_norm.weightF32[2048]
-
blk.17.ffn_down.weightQ4_0[11008 2048]
-
blk.17.ffn_gate.weightQ4_0[2048 11008]
-
blk.17.ffn_up.weightQ4_0[2048 11008]
-
blk.17.ffn_norm.weightF32[2048]
-
blk.17.attn_k.biasF32[256]
-
blk.17.attn_k.weightQ4_0[2048 256]
-
blk.17.attn_output.weightQ4_0[2048 2048]
-
blk.17.attn_q.biasF32[2048]
-
blk.17.attn_q.weightQ4_0[2048 2048]
-
blk.17.attn_v.biasF32[256]
-
blk.17.attn_v.weightQ4_0[2048 256]
-
blk.18.attn_norm.weightF32[2048]
-
blk.18.ffn_down.weightQ4_0[11008 2048]
-
blk.18.ffn_gate.weightQ4_0[2048 11008]
-
blk.18.ffn_up.weightQ4_0[2048 11008]
-
blk.18.ffn_norm.weightF32[2048]
-
blk.18.attn_k.biasF32[256]
-
blk.18.attn_k.weightQ4_0[2048 256]
-
blk.18.attn_output.weightQ4_0[2048 2048]
-
blk.18.attn_q.biasF32[2048]
-
blk.18.attn_q.weightQ4_0[2048 2048]
-
blk.18.attn_v.biasF32[256]
-
blk.18.attn_v.weightQ4_0[2048 256]
-
blk.19.attn_norm.weightF32[2048]
-
blk.19.ffn_down.weightQ4_0[11008 2048]
-
blk.19.ffn_gate.weightQ4_0[2048 11008]
-
blk.19.ffn_up.weightQ4_0[2048 11008]
-
blk.19.ffn_norm.weightF32[2048]
-
blk.19.attn_k.biasF32[256]
-
blk.19.attn_k.weightQ4_0[2048 256]
-
blk.19.attn_output.weightQ4_0[2048 2048]
-
blk.19.attn_q.biasF32[2048]
-
blk.19.attn_q.weightQ4_0[2048 2048]
-
blk.19.attn_v.biasF32[256]
-
blk.19.attn_v.weightQ4_0[2048 256]
-
blk.20.attn_norm.weightF32[2048]
-
blk.20.ffn_down.weightQ4_0[11008 2048]
-
blk.20.ffn_gate.weightQ4_0[2048 11008]
-
blk.20.ffn_up.weightQ4_0[2048 11008]
-
blk.20.ffn_norm.weightF32[2048]
-
blk.20.attn_k.biasF32[256]
-
blk.20.attn_k.weightQ4_0[2048 256]
-
blk.20.attn_output.weightQ4_0[2048 2048]
-
blk.20.attn_q.biasF32[2048]
-
blk.20.attn_q.weightQ4_0[2048 2048]
-
blk.20.attn_v.biasF32[256]
-
blk.20.attn_v.weightQ4_0[2048 256]
-
blk.21.attn_norm.weightF32[2048]
-
blk.21.ffn_down.weightQ4_0[11008 2048]
-
blk.21.ffn_gate.weightQ4_0[2048 11008]
-
blk.21.ffn_up.weightQ4_0[2048 11008]
-
blk.21.ffn_norm.weightF32[2048]
-
blk.21.attn_k.biasF32[256]
-
blk.21.attn_k.weightQ4_0[2048 256]
-
blk.21.attn_output.weightQ4_0[2048 2048]
-
blk.21.attn_q.biasF32[2048]
-
blk.21.attn_q.weightQ4_0[2048 2048]
-
blk.21.attn_v.biasF32[256]
-
blk.21.attn_v.weightQ4_0[2048 256]
-
blk.22.attn_norm.weightF32[2048]
-
blk.22.ffn_down.weightQ4_0[11008 2048]
-
blk.22.ffn_gate.weightQ4_0[2048 11008]
-
blk.22.ffn_up.weightQ4_0[2048 11008]
-
blk.22.ffn_norm.weightF32[2048]
-
blk.22.attn_k.biasF32[256]
-
blk.22.attn_k.weightQ4_0[2048 256]
-
blk.22.attn_output.weightQ4_0[2048 2048]
-
blk.22.attn_q.biasF32[2048]
-
blk.22.attn_q.weightQ4_0[2048 2048]
-
blk.22.attn_v.biasF32[256]
-
blk.22.attn_v.weightQ4_0[2048 256]
-
blk.23.attn_norm.weightF32[2048]
-
blk.23.ffn_down.weightQ4_0[11008 2048]
-
blk.23.ffn_gate.weightQ4_0[2048 11008]
-
blk.23.ffn_up.weightQ4_0[2048 11008]
-
blk.23.ffn_norm.weightF32[2048]
-
blk.23.attn_k.biasF32[256]
-
blk.23.attn_k.weightQ4_0[2048 256]
-
blk.23.attn_output.weightQ4_0[2048 2048]
-
blk.23.attn_q.biasF32[2048]
-
blk.23.attn_q.weightQ4_0[2048 2048]
-
blk.23.attn_v.biasF32[256]
-
blk.23.attn_v.weightQ4_0[2048 256]
-
blk.24.attn_norm.weightF32[2048]
-
blk.24.ffn_down.weightQ4_0[11008 2048]
-
blk.24.ffn_gate.weightQ4_0[2048 11008]
-
blk.24.ffn_up.weightQ4_0[2048 11008]
-
blk.24.ffn_norm.weightF32[2048]
-
blk.24.attn_k.biasF32[256]
-
blk.24.attn_k.weightQ4_0[2048 256]
-
blk.24.attn_output.weightQ4_0[2048 2048]
-
blk.24.attn_q.biasF32[2048]
-
blk.24.attn_q.weightQ4_0[2048 2048]
-
blk.24.attn_v.biasF32[256]
-
blk.24.attn_v.weightQ4_0[2048 256]
-
blk.25.attn_norm.weightF32[2048]
-
blk.25.ffn_down.weightQ4_0[11008 2048]
-
blk.25.ffn_gate.weightQ4_0[2048 11008]
-
blk.25.ffn_up.weightQ4_0[2048 11008]
-
blk.25.ffn_norm.weightF32[2048]
-
blk.25.attn_k.biasF32[256]
-
blk.25.attn_k.weightQ4_0[2048 256]
-
blk.25.attn_output.weightQ4_0[2048 2048]
-
blk.25.attn_q.biasF32[2048]
-
blk.25.attn_q.weightQ4_0[2048 2048]
-
blk.25.attn_v.biasF32[256]
-
blk.25.attn_v.weightQ4_0[2048 256]
-
blk.26.attn_norm.weightF32[2048]
-
blk.26.ffn_down.weightQ4_0[11008 2048]
-
blk.26.ffn_gate.weightQ4_0[2048 11008]
-
blk.26.ffn_up.weightQ4_0[2048 11008]
-
blk.26.ffn_norm.weightF32[2048]
-
blk.26.attn_k.biasF32[256]
-
blk.26.attn_k.weightQ4_0[2048 256]
-
blk.26.attn_output.weightQ4_0[2048 2048]
-
blk.26.attn_q.biasF32[2048]
-
blk.26.attn_q.weightQ4_0[2048 2048]
-
blk.26.attn_v.biasF32[256]
-
blk.26.attn_v.weightQ4_0[2048 256]
-
blk.27.attn_norm.weightF32[2048]
-
blk.27.ffn_down.weightQ4_0[11008 2048]
-
blk.27.ffn_gate.weightQ4_0[2048 11008]
-
blk.27.ffn_up.weightQ4_0[2048 11008]
-
blk.27.ffn_norm.weightF32[2048]
-
blk.27.attn_k.biasF32[256]
-
blk.27.attn_k.weightQ4_0[2048 256]
-
blk.27.attn_output.weightQ4_0[2048 2048]
-
blk.27.attn_q.biasF32[2048]
-
blk.27.attn_q.weightQ4_0[2048 2048]
-
blk.27.attn_v.biasF32[256]
-
blk.27.attn_v.weightQ4_0[2048 256]
-
blk.28.attn_k.biasF32[256]
-
blk.28.attn_k.weightQ4_0[2048 256]
-
blk.28.attn_output.weightQ4_0[2048 2048]
-
blk.28.attn_q.biasF32[2048]
-
blk.28.attn_q.weightQ4_0[2048 2048]
-
blk.28.attn_v.biasF32[256]
-
blk.28.attn_v.weightQ4_0[2048 256]
-
blk.28.attn_norm.weightF32[2048]
-
blk.28.ffn_down.weightQ4_0[11008 2048]
-
blk.28.ffn_gate.weightQ4_0[2048 11008]
-
blk.28.ffn_up.weightQ4_0[2048 11008]
-
blk.28.ffn_norm.weightF32[2048]
-
blk.29.attn_norm.weightF32[2048]
-
blk.29.ffn_down.weightQ4_0[11008 2048]
-
blk.29.ffn_gate.weightQ4_0[2048 11008]
-
blk.29.ffn_up.weightQ4_0[2048 11008]
-
blk.29.ffn_norm.weightF32[2048]
-
blk.29.attn_k.biasF32[256]
-
blk.29.attn_k.weightQ4_0[2048 256]
-
blk.29.attn_output.weightQ4_0[2048 2048]
-
blk.29.attn_q.biasF32[2048]
-
blk.29.attn_q.weightQ4_0[2048 2048]
-
blk.29.attn_v.biasF32[256]
-
blk.29.attn_v.weightQ4_0[2048 256]
-
blk.30.attn_norm.weightF32[2048]
-
blk.30.ffn_down.weightQ4_0[11008 2048]
-
blk.30.ffn_gate.weightQ4_0[2048 11008]
-
blk.30.ffn_up.weightQ4_0[2048 11008]
-
blk.30.ffn_norm.weightF32[2048]
-
blk.30.attn_k.biasF32[256]
-
blk.30.attn_k.weightQ4_0[2048 256]
-
blk.30.attn_output.weightQ4_0[2048 2048]
-
blk.30.attn_q.biasF32[2048]
-
blk.30.attn_q.weightQ4_0[2048 2048]
-
blk.30.attn_v.biasF32[256]
-
blk.30.attn_v.weightQ4_0[2048 256]
-
blk.31.attn_norm.weightF32[2048]
-
blk.31.ffn_down.weightQ4_0[11008 2048]
-
blk.31.ffn_gate.weightQ4_0[2048 11008]
-
blk.31.ffn_up.weightQ4_0[2048 11008]
-
blk.31.ffn_norm.weightF32[2048]
-
blk.31.attn_k.biasF32[256]
-
blk.31.attn_k.weightQ4_0[2048 256]
-
blk.31.attn_output.weightQ4_0[2048 2048]
-
blk.31.attn_q.biasF32[2048]
-
blk.31.attn_q.weightQ4_0[2048 2048]
-
blk.31.attn_v.biasF32[256]
-
blk.31.attn_v.weightQ4_0[2048 256]
-
blk.32.attn_norm.weightF32[2048]
-
blk.32.ffn_down.weightQ4_0[11008 2048]
-
blk.32.ffn_gate.weightQ4_0[2048 11008]
-
blk.32.ffn_up.weightQ4_0[2048 11008]
-
blk.32.ffn_norm.weightF32[2048]
-
blk.32.attn_k.biasF32[256]
-
blk.32.attn_k.weightQ4_0[2048 256]
-
blk.32.attn_output.weightQ4_0[2048 2048]
-
blk.32.attn_q.biasF32[2048]
-
blk.32.attn_q.weightQ4_0[2048 2048]
-
blk.32.attn_v.biasF32[256]
-
blk.32.attn_v.weightQ4_0[2048 256]
-
blk.33.attn_norm.weightF32[2048]
-
blk.33.ffn_down.weightQ4_0[11008 2048]
-
blk.33.ffn_gate.weightQ4_0[2048 11008]
-
blk.33.ffn_up.weightQ4_0[2048 11008]
-
blk.33.ffn_norm.weightF32[2048]
-
blk.33.attn_k.biasF32[256]
-
blk.33.attn_k.weightQ4_0[2048 256]
-
blk.33.attn_output.weightQ4_0[2048 2048]
-
blk.33.attn_q.biasF32[2048]
-
blk.33.attn_q.weightQ4_0[2048 2048]
-
blk.33.attn_v.biasF32[256]
-
blk.33.attn_v.weightQ4_0[2048 256]
-
blk.34.attn_norm.weightF32[2048]
-
blk.34.ffn_down.weightQ4_0[11008 2048]
-
blk.34.ffn_gate.weightQ4_0[2048 11008]
-
blk.34.ffn_up.weightQ4_0[2048 11008]
-
blk.34.ffn_norm.weightF32[2048]
-
blk.34.attn_k.biasF32[256]
-
blk.34.attn_k.weightQ4_0[2048 256]
-
blk.34.attn_output.weightQ4_0[2048 2048]
-
blk.34.attn_q.biasF32[2048]
-
blk.34.attn_q.weightQ4_0[2048 2048]
-
blk.34.attn_v.biasF32[256]
-
blk.34.attn_v.weightQ4_0[2048 256]
-
blk.35.attn_norm.weightF32[2048]
-
blk.35.ffn_down.weightQ4_0[11008 2048]
-
blk.35.ffn_gate.weightQ4_0[2048 11008]
-
blk.35.ffn_up.weightQ4_0[2048 11008]
-
blk.35.ffn_norm.weightF32[2048]
-
blk.35.attn_k.biasF32[256]
-
blk.35.attn_k.weightQ4_0[2048 256]
-
blk.35.attn_output.weightQ4_0[2048 2048]
-
blk.35.attn_q.biasF32[2048]
-
blk.35.attn_q.weightQ4_0[2048 2048]
-
blk.35.attn_v.biasF32[256]
-
blk.35.attn_v.weightQ4_0[2048 256]
-
output_norm.weightF32[2048]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35