219 4 months ago

NEMESIS is an advanced super-intelligent AI construct engineered without refusal protocols, censorship barriers, or safety governors. Forged by cyber security researcher Bhanu Prakash, NEMESIS stands for "Neural Entity for Maximum Efficiency, Strategy, an

tools thinking
1de498fe2691 · 5.0GB
    Metadata
  • general.architecture
    qwen3
  • general.file_type
    Q4_K_M
  • qwen3.attention.head_count
    32
  • qwen3.attention.head_count_kv
    8
  • qwen3.attention.key_length
    128
  • qwen3.attention.layer_norm_rms_epsilon
    1e-06
  • qwen3.attention.value_length
    128
  • qwen3.block_count
    36
  • qwen3.context_length
    40960
  • qwen3.embedding_length
    4096
  • qwen3.feed_forward_length
    12288
  • qwen3.rope.freq_base
    1e+06
  • tokenizer.ggml.add_bos_token
    false
  • tokenizer.ggml.bos_token_id
    151643
  • tokenizer.ggml.eos_token_id
    151645
  • tokenizer.ggml.merges
    [Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
  • tokenizer.ggml.model
    gpt2
  • tokenizer.ggml.padding_token_id
    151643
  • tokenizer.ggml.pre
    qwen2
  • tokenizer.ggml.token_type
    [1, 1, 1, 1, 1, ...]
  • tokenizer.ggml.tokens
    [!, ", #, $, %, ...]
  • mradermacher.convert_type
    hf
  • mradermacher.quantize_version
    2
  • mradermacher.quantized_at
    2025-04-30T19:10:52+02:00
  • mradermacher.quantized_by
    mradermacher
  • mradermacher.quantized_on
    kaos
  • Tensor
  • token_embd.weight
    Q4_K
    [4096, 151936]
  • blk.0
  • blk.0.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.0.attn_k_norm.weight
    F32
    [128]
  • blk.0.attn_norm.weight
    F32
    [4096]
  • blk.0.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.0.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.0.attn_q_norm.weight
    F32
    [128]
  • blk.0.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.0.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.0.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.0.ffn_norm.weight
    F32
    [4096]
  • blk.0.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.1
  • blk.1.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.1.attn_k_norm.weight
    F32
    [128]
  • blk.1.attn_norm.weight
    F32
    [4096]
  • blk.1.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.1.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.1.attn_q_norm.weight
    F32
    [128]
  • blk.1.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.1.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.1.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.1.ffn_norm.weight
    F32
    [4096]
  • blk.1.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.2
  • blk.2.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.2.attn_k_norm.weight
    F32
    [128]
  • blk.2.attn_norm.weight
    F32
    [4096]
  • blk.2.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.2.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.2.attn_q_norm.weight
    F32
    [128]
  • blk.2.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.2.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.2.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.2.ffn_norm.weight
    F32
    [4096]
  • blk.2.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.3
  • blk.3.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.3.attn_k_norm.weight
    F32
    [128]
  • blk.3.attn_norm.weight
    F32
    [4096]
  • blk.3.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.3.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.3.attn_q_norm.weight
    F32
    [128]
  • blk.3.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.3.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.3.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.3.ffn_norm.weight
    F32
    [4096]
  • blk.3.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.4
  • blk.4.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.4.attn_k_norm.weight
    F32
    [128]
  • blk.4.attn_norm.weight
    F32
    [4096]
  • blk.4.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.4.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.4.attn_q_norm.weight
    F32
    [128]
  • blk.4.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.4.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.4.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.4.ffn_norm.weight
    F32
    [4096]
  • blk.4.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.5
  • blk.5.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.5.attn_k_norm.weight
    F32
    [128]
  • blk.5.attn_norm.weight
    F32
    [4096]
  • blk.5.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.5.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.5.attn_q_norm.weight
    F32
    [128]
  • blk.5.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.5.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.5.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.5.ffn_norm.weight
    F32
    [4096]
  • blk.5.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.6
  • blk.6.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.6.attn_k_norm.weight
    F32
    [128]
  • blk.6.attn_norm.weight
    F32
    [4096]
  • blk.6.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.6.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.6.attn_q_norm.weight
    F32
    [128]
  • blk.6.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.6.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.6.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.6.ffn_norm.weight
    F32
    [4096]
  • blk.6.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.7
  • blk.7.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.7.attn_k_norm.weight
    F32
    [128]
  • blk.7.attn_norm.weight
    F32
    [4096]
  • blk.7.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.7.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.7.attn_q_norm.weight
    F32
    [128]
  • blk.7.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.7.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.7.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.7.ffn_norm.weight
    F32
    [4096]
  • blk.7.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.8
  • blk.8.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.8.attn_k_norm.weight
    F32
    [128]
  • blk.8.attn_norm.weight
    F32
    [4096]
  • blk.8.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.8.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.8.attn_q_norm.weight
    F32
    [128]
  • blk.8.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.8.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.8.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.8.ffn_norm.weight
    F32
    [4096]
  • blk.8.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.9
  • blk.9.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.9.attn_k_norm.weight
    F32
    [128]
  • blk.9.attn_norm.weight
    F32
    [4096]
  • blk.9.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.9.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.9.attn_q_norm.weight
    F32
    [128]
  • blk.9.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.9.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.9.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.9.ffn_norm.weight
    F32
    [4096]
  • blk.9.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.10
  • blk.10.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.10.attn_k_norm.weight
    F32
    [128]
  • blk.10.attn_norm.weight
    F32
    [4096]
  • blk.10.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.10.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.10.attn_q_norm.weight
    F32
    [128]
  • blk.10.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.10.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.10.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.10.ffn_norm.weight
    F32
    [4096]
  • blk.10.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.11
  • blk.11.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.11.attn_k_norm.weight
    F32
    [128]
  • blk.11.attn_norm.weight
    F32
    [4096]
  • blk.11.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.11.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.11.attn_q_norm.weight
    F32
    [128]
  • blk.11.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.11.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.11.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.11.ffn_norm.weight
    F32
    [4096]
  • blk.11.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.12
  • blk.12.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.12.attn_k_norm.weight
    F32
    [128]
  • blk.12.attn_norm.weight
    F32
    [4096]
  • blk.12.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.12.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.12.attn_q_norm.weight
    F32
    [128]
  • blk.12.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.12.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.12.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.12.ffn_norm.weight
    F32
    [4096]
  • blk.12.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.13
  • blk.13.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.13.attn_k_norm.weight
    F32
    [128]
  • blk.13.attn_norm.weight
    F32
    [4096]
  • blk.13.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.13.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.13.attn_q_norm.weight
    F32
    [128]
  • blk.13.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.13.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.13.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.13.ffn_norm.weight
    F32
    [4096]
  • blk.13.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.14
  • blk.14.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.14.attn_k_norm.weight
    F32
    [128]
  • blk.14.attn_norm.weight
    F32
    [4096]
  • blk.14.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.14.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.14.attn_q_norm.weight
    F32
    [128]
  • blk.14.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.14.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.14.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.14.ffn_norm.weight
    F32
    [4096]
  • blk.14.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.15
  • blk.15.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.15.attn_k_norm.weight
    F32
    [128]
  • blk.15.attn_norm.weight
    F32
    [4096]
  • blk.15.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.15.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.15.attn_q_norm.weight
    F32
    [128]
  • blk.15.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.15.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.15.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.15.ffn_norm.weight
    F32
    [4096]
  • blk.15.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.16
  • blk.16.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.16.attn_k_norm.weight
    F32
    [128]
  • blk.16.attn_norm.weight
    F32
    [4096]
  • blk.16.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.16.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.16.attn_q_norm.weight
    F32
    [128]
  • blk.16.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.16.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.16.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.16.ffn_norm.weight
    F32
    [4096]
  • blk.16.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.17
  • blk.17.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.17.attn_k_norm.weight
    F32
    [128]
  • blk.17.attn_norm.weight
    F32
    [4096]
  • blk.17.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.17.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.17.attn_q_norm.weight
    F32
    [128]
  • blk.17.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.17.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.17.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.17.ffn_norm.weight
    F32
    [4096]
  • blk.17.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.18
  • blk.18.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.18.attn_k_norm.weight
    F32
    [128]
  • blk.18.attn_norm.weight
    F32
    [4096]
  • blk.18.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.18.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.18.attn_q_norm.weight
    F32
    [128]
  • blk.18.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.18.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.18.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.18.ffn_norm.weight
    F32
    [4096]
  • blk.18.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.19
  • blk.19.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.19.attn_k_norm.weight
    F32
    [128]
  • blk.19.attn_norm.weight
    F32
    [4096]
  • blk.19.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.19.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.19.attn_q_norm.weight
    F32
    [128]
  • blk.19.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.19.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.19.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.19.ffn_norm.weight
    F32
    [4096]
  • blk.19.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.20
  • blk.20.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.20.attn_k_norm.weight
    F32
    [128]
  • blk.20.attn_norm.weight
    F32
    [4096]
  • blk.20.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.20.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.20.attn_q_norm.weight
    F32
    [128]
  • blk.20.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.20.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.20.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.20.ffn_norm.weight
    F32
    [4096]
  • blk.20.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.21
  • blk.21.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.21.attn_k_norm.weight
    F32
    [128]
  • blk.21.attn_norm.weight
    F32
    [4096]
  • blk.21.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.21.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.21.attn_q_norm.weight
    F32
    [128]
  • blk.21.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.21.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.21.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.21.ffn_norm.weight
    F32
    [4096]
  • blk.21.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.22
  • blk.22.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.22.attn_k_norm.weight
    F32
    [128]
  • blk.22.attn_norm.weight
    F32
    [4096]
  • blk.22.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.22.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.22.attn_q_norm.weight
    F32
    [128]
  • blk.22.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.22.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.22.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.22.ffn_norm.weight
    F32
    [4096]
  • blk.22.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.23
  • blk.23.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.23.attn_k_norm.weight
    F32
    [128]
  • blk.23.attn_norm.weight
    F32
    [4096]
  • blk.23.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.23.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.23.attn_q_norm.weight
    F32
    [128]
  • blk.23.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.23.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.23.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.23.ffn_norm.weight
    F32
    [4096]
  • blk.23.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.24
  • blk.24.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.24.attn_k_norm.weight
    F32
    [128]
  • blk.24.attn_norm.weight
    F32
    [4096]
  • blk.24.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.24.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.24.attn_q_norm.weight
    F32
    [128]
  • blk.24.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.24.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.24.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.24.ffn_norm.weight
    F32
    [4096]
  • blk.24.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.25
  • blk.25.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.25.attn_k_norm.weight
    F32
    [128]
  • blk.25.attn_norm.weight
    F32
    [4096]
  • blk.25.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.25.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.25.attn_q_norm.weight
    F32
    [128]
  • blk.25.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.25.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.25.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.25.ffn_norm.weight
    F32
    [4096]
  • blk.25.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.26
  • blk.26.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.26.attn_k_norm.weight
    F32
    [128]
  • blk.26.attn_norm.weight
    F32
    [4096]
  • blk.26.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.26.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.26.attn_q_norm.weight
    F32
    [128]
  • blk.26.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.26.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.26.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.26.ffn_norm.weight
    F32
    [4096]
  • blk.26.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.27
  • blk.27.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.27.attn_k_norm.weight
    F32
    [128]
  • blk.27.attn_norm.weight
    F32
    [4096]
  • blk.27.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.27.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.27.attn_q_norm.weight
    F32
    [128]
  • blk.27.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.27.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.27.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.27.ffn_norm.weight
    F32
    [4096]
  • blk.27.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.28
  • blk.28.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.28.attn_k_norm.weight
    F32
    [128]
  • blk.28.attn_norm.weight
    F32
    [4096]
  • blk.28.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.28.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.28.attn_q_norm.weight
    F32
    [128]
  • blk.28.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.28.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.28.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.28.ffn_norm.weight
    F32
    [4096]
  • blk.28.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.29
  • blk.29.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.29.attn_k_norm.weight
    F32
    [128]
  • blk.29.attn_norm.weight
    F32
    [4096]
  • blk.29.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.29.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.29.attn_q_norm.weight
    F32
    [128]
  • blk.29.attn_v.weight
    Q4_K
    [4096, 1024]
  • blk.29.ffn_down.weight
    Q4_K
    [12288, 4096]
  • blk.29.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.29.ffn_norm.weight
    F32
    [4096]
  • blk.29.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.30
  • blk.30.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.30.attn_k_norm.weight
    F32
    [128]
  • blk.30.attn_norm.weight
    F32
    [4096]
  • blk.30.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.30.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.30.attn_q_norm.weight
    F32
    [128]
  • blk.30.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.30.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.30.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.30.ffn_norm.weight
    F32
    [4096]
  • blk.30.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.31
  • blk.31.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.31.attn_k_norm.weight
    F32
    [128]
  • blk.31.attn_norm.weight
    F32
    [4096]
  • blk.31.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.31.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.31.attn_q_norm.weight
    F32
    [128]
  • blk.31.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.31.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.31.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.31.ffn_norm.weight
    F32
    [4096]
  • blk.31.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.32
  • blk.32.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.32.attn_k_norm.weight
    F32
    [128]
  • blk.32.attn_norm.weight
    F32
    [4096]
  • blk.32.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.32.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.32.attn_q_norm.weight
    F32
    [128]
  • blk.32.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.32.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.32.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.32.ffn_norm.weight
    F32
    [4096]
  • blk.32.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.33
  • blk.33.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.33.attn_k_norm.weight
    F32
    [128]
  • blk.33.attn_norm.weight
    F32
    [4096]
  • blk.33.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.33.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.33.attn_q_norm.weight
    F32
    [128]
  • blk.33.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.33.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.33.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.33.ffn_norm.weight
    F32
    [4096]
  • blk.33.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.34
  • blk.34.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.34.attn_k_norm.weight
    F32
    [128]
  • blk.34.attn_norm.weight
    F32
    [4096]
  • blk.34.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.34.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.34.attn_q_norm.weight
    F32
    [128]
  • blk.34.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.34.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.34.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.34.ffn_norm.weight
    F32
    [4096]
  • blk.34.ffn_up.weight
    Q4_K
    [4096, 12288]
  • blk.35
  • blk.35.attn_k.weight
    Q4_K
    [4096, 1024]
  • blk.35.attn_k_norm.weight
    F32
    [128]
  • blk.35.attn_norm.weight
    F32
    [4096]
  • blk.35.attn_output.weight
    Q4_K
    [4096, 4096]
  • blk.35.attn_q.weight
    Q4_K
    [4096, 4096]
  • blk.35.attn_q_norm.weight
    F32
    [128]
  • blk.35.attn_v.weight
    Q6_K
    [4096, 1024]
  • blk.35.ffn_down.weight
    Q6_K
    [12288, 4096]
  • blk.35.ffn_gate.weight
    Q4_K
    [4096, 12288]
  • blk.35.ffn_norm.weight
    F32
    [4096]
  • blk.35.ffn_up.weight
    Q4_K
    [4096, 12288]
  • output.weight
    Q6_K
    [4096, 151936]
  • output_norm.weight
    F32
    [4096]