I-quants for mistral-nemo-instruct-2407-abliterated
Tools
12B
4 Pulls Updated 3 days ago
73e812175108 · 5.7GB
-
mradermacher.convert_typehf
-
mradermacher.quantize_version2
-
mradermacher.quantized_at2024-09-02T22:20:26+02:00
-
mradermacher.quantized_bymradermacher
-
mradermacher.quantized_ondb3
-
general.architecturellama
-
general.file_typeIQ2_S
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count40
-
llama.context_length1024000
-
llama.embedding_length5120
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size131072
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.merges[Ġ Ġ Ġ t e r i n Ġ ĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id10
-
tokenizer.ggml.pretekken
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120 131072]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ4_K[14336 5120]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.0.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.0.attn_output.weightQ4_K[4096 5120]
-
blk.0.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.0.attn_v.weightQ4_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ4_K[14336 5120]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.1.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.1.attn_output.weightQ4_K[4096 5120]
-
blk.1.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.1.attn_v.weightQ4_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ4_K[14336 5120]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.2.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.2.attn_output.weightQ4_K[4096 5120]
-
blk.2.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.2.attn_v.weightQ4_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ4_K[14336 5120]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.3.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.3.attn_output.weightQ4_K[4096 5120]
-
blk.3.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.3.attn_v.weightQ4_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ4_K[14336 5120]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.4.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.4.attn_output.weightQ4_K[4096 5120]
-
blk.4.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.4.attn_v.weightQ4_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.5.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.5.attn_output.weightQ4_K[4096 5120]
-
blk.5.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.5.attn_v.weightQ4_K[5120 1024]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.6.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.6.attn_output.weightQ4_K[4096 5120]
-
blk.6.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.6.attn_v.weightQ4_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.6.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.7.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.7.attn_output.weightQ4_K[4096 5120]
-
blk.7.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.7.attn_v.weightQ4_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.8.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.8.attn_output.weightQ4_K[4096 5120]
-
blk.8.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.8.attn_v.weightQ4_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.9.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.9.attn_output.weightQ4_K[4096 5120]
-
blk.9.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.9.attn_v.weightQ4_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.10.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.10.attn_output.weightQ4_K[4096 5120]
-
blk.10.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.10.attn_v.weightQ4_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.11.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.11.attn_output.weightQ4_K[4096 5120]
-
blk.11.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.11.attn_v.weightQ4_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.12.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.12.attn_output.weightQ4_K[4096 5120]
-
blk.12.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.12.attn_v.weightQ4_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.13.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.13.attn_output.weightQ4_K[4096 5120]
-
blk.13.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.13.attn_v.weightQ4_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.14.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.14.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.14.attn_output.weightQ4_K[4096 5120]
-
blk.14.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.14.attn_v.weightQ4_K[5120 1024]
-
blk.15.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.15.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.15.attn_output.weightQ4_K[4096 5120]
-
blk.15.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.15.attn_v.weightQ4_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.15.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.16.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.16.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.16.attn_output.weightQ4_K[4096 5120]
-
blk.16.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.16.attn_v.weightQ4_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.17.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.17.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.17.attn_output.weightQ4_K[4096 5120]
-
blk.17.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.17.attn_v.weightQ4_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.18.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.18.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.18.attn_output.weightQ4_K[4096 5120]
-
blk.18.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.18.attn_v.weightQ4_K[5120 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.19.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.19.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.19.attn_output.weightQ4_K[4096 5120]
-
blk.19.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.19.attn_v.weightQ4_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.20.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.20.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.20.attn_output.weightQ4_K[4096 5120]
-
blk.20.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.20.attn_v.weightQ4_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.21.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.21.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.21.attn_output.weightQ4_K[4096 5120]
-
blk.21.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.21.attn_v.weightQ4_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.22.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.22.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.22.attn_output.weightQ4_K[4096 5120]
-
blk.22.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.22.attn_v.weightQ4_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.23.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.23.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.23.attn_output.weightQ4_K[4096 5120]
-
blk.23.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.23.attn_v.weightQ4_K[5120 1024]
-
blk.24.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.24.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.24.attn_output.weightQ4_K[4096 5120]
-
blk.24.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.24.attn_v.weightQ4_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.24.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.25.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.25.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.25.attn_output.weightQ4_K[4096 5120]
-
blk.25.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.25.attn_v.weightQ4_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.26.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.26.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.26.attn_output.weightQ4_K[4096 5120]
-
blk.26.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.26.attn_v.weightQ4_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.27.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.27.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.27.attn_output.weightQ4_K[4096 5120]
-
blk.27.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.27.attn_v.weightQ4_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.28.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.28.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.28.attn_output.weightQ4_K[4096 5120]
-
blk.28.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.28.attn_v.weightQ4_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.29.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.29.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.29.attn_output.weightQ4_K[4096 5120]
-
blk.29.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.29.attn_v.weightQ4_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.30.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.30.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.30.attn_output.weightQ4_K[4096 5120]
-
blk.30.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.30.attn_v.weightQ4_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.31.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.31.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.31.attn_output.weightQ4_K[4096 5120]
-
blk.31.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.31.attn_v.weightQ4_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.32.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.32.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.32.attn_output.weightQ4_K[4096 5120]
-
blk.32.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.32.attn_v.weightQ4_K[5120 1024]
-
blk.33.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.33.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.33.attn_output.weightQ4_K[4096 5120]
-
blk.33.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.33.attn_v.weightQ4_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.33.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.34.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.34.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.34.attn_output.weightQ4_K[4096 5120]
-
blk.34.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.34.attn_v.weightQ4_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.35.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.35.attn_output.weightQ4_K[4096 5120]
-
blk.35.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.35.attn_v.weightQ4_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.36.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.36.attn_output.weightQ4_K[4096 5120]
-
blk.36.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.36.attn_v.weightQ4_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.37.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.37.attn_output.weightQ4_K[4096 5120]
-
blk.37.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.37.attn_v.weightQ4_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.38.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.38.attn_output.weightQ4_K[4096 5120]
-
blk.38.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.38.attn_v.weightQ4_K[5120 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.39.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weight(!unknown_type 21!)[5120 1024]
-
blk.39.attn_output.weightQ4_K[4096 5120]
-
blk.39.attn_q.weight(!unknown_type 21!)[5120 4096]
-
blk.39.attn_v.weightQ4_K[5120 1024]
-
output.weightQ6_K[5120 131072]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39