I-quants for mistral-nemo-instruct-2407-abliterated
Tools
12B
4 Pulls Updated 3 days ago
775cb55890ba · 5.3GB
-
mradermacher.convert_typehf
-
mradermacher.quantize_version2
-
mradermacher.quantized_at2024-09-02T22:32:42+02:00
-
mradermacher.quantized_bymradermacher
-
mradermacher.quantized_ondb3
-
general.architecturellama
-
general.file_typeIQ3_XS
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count40
-
llama.context_length1024000
-
llama.embedding_length5120
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size131072
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.merges[Ġ Ġ Ġ t e r i n Ġ ĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id10
-
tokenizer.ggml.pretekken
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120 131072]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.0.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weightI32[5120 1024]
-
blk.0.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.0.attn_q.weightI32[5120 4096]
-
blk.0.attn_v.weightQ4_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.1.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weightI32[5120 1024]
-
blk.1.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.1.attn_q.weightI32[5120 4096]
-
blk.1.attn_v.weightQ4_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.2.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weightI32[5120 1024]
-
blk.2.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.2.attn_q.weightI32[5120 4096]
-
blk.2.attn_v.weightQ4_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.3.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weightI32[5120 1024]
-
blk.3.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.3.attn_q.weightI32[5120 4096]
-
blk.3.attn_v.weightQ4_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.4.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weightI32[5120 1024]
-
blk.4.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.4.attn_q.weightI32[5120 4096]
-
blk.4.attn_v.weightQ4_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.5.ffn_gate.weightI32[5120 14336]
-
blk.5.ffn_up.weightI32[5120 14336]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weightI32[5120 1024]
-
blk.5.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.5.attn_q.weightI32[5120 4096]
-
blk.5.attn_v.weightQ4_K[5120 1024]
-
blk.6.ffn_gate.weightI32[5120 14336]
-
blk.6.attn_k.weightI32[5120 1024]
-
blk.6.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.6.attn_q.weightI32[5120 4096]
-
blk.6.attn_v.weightQ4_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.6.ffn_up.weightI32[5120 14336]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.7.ffn_gate.weightI32[5120 14336]
-
blk.7.ffn_up.weightI32[5120 14336]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weightI32[5120 1024]
-
blk.7.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.7.attn_q.weightI32[5120 4096]
-
blk.7.attn_v.weightQ4_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.8.ffn_gate.weightI32[5120 14336]
-
blk.8.ffn_up.weightI32[5120 14336]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weightI32[5120 1024]
-
blk.8.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.8.attn_q.weightI32[5120 4096]
-
blk.8.attn_v.weightQ4_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.9.ffn_gate.weightI32[5120 14336]
-
blk.9.ffn_up.weightI32[5120 14336]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weightI32[5120 1024]
-
blk.9.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.9.attn_q.weightI32[5120 4096]
-
blk.9.attn_v.weightQ4_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.10.ffn_gate.weightI32[5120 14336]
-
blk.10.ffn_up.weightI32[5120 14336]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weightI32[5120 1024]
-
blk.10.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.10.attn_q.weightI32[5120 4096]
-
blk.10.attn_v.weightQ4_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.11.ffn_gate.weightI32[5120 14336]
-
blk.11.ffn_up.weightI32[5120 14336]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weightI32[5120 1024]
-
blk.11.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.11.attn_q.weightI32[5120 4096]
-
blk.11.attn_v.weightQ4_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.12.ffn_gate.weightI32[5120 14336]
-
blk.12.ffn_up.weightI32[5120 14336]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weightI32[5120 1024]
-
blk.12.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.12.attn_q.weightI32[5120 4096]
-
blk.12.attn_v.weightQ4_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.13.ffn_gate.weightI32[5120 14336]
-
blk.13.ffn_up.weightI32[5120 14336]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weightI32[5120 1024]
-
blk.13.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.13.attn_q.weightI32[5120 4096]
-
blk.13.attn_v.weightQ4_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.14.ffn_gate.weightI32[5120 14336]
-
blk.14.ffn_up.weightI32[5120 14336]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weightI32[5120 1024]
-
blk.14.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.14.attn_q.weightI32[5120 4096]
-
blk.14.attn_v.weightQ4_K[5120 1024]
-
blk.15.ffn_gate.weightI32[5120 14336]
-
blk.15.attn_k.weightI32[5120 1024]
-
blk.15.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.15.attn_q.weightI32[5120 4096]
-
blk.15.attn_v.weightQ4_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.15.ffn_up.weightI32[5120 14336]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.16.ffn_gate.weightI32[5120 14336]
-
blk.16.ffn_up.weightI32[5120 14336]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weightI32[5120 1024]
-
blk.16.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.16.attn_q.weightI32[5120 4096]
-
blk.16.attn_v.weightQ4_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.17.ffn_gate.weightI32[5120 14336]
-
blk.17.ffn_up.weightI32[5120 14336]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weightI32[5120 1024]
-
blk.17.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.17.attn_q.weightI32[5120 4096]
-
blk.17.attn_v.weightQ4_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.18.ffn_gate.weightI32[5120 14336]
-
blk.18.ffn_up.weightI32[5120 14336]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weightI32[5120 1024]
-
blk.18.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.18.attn_q.weightI32[5120 4096]
-
blk.18.attn_v.weightQ4_K[5120 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.19.ffn_gate.weightI32[5120 14336]
-
blk.19.ffn_up.weightI32[5120 14336]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weightI32[5120 1024]
-
blk.19.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.19.attn_q.weightI32[5120 4096]
-
blk.19.attn_v.weightQ4_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.20.ffn_gate.weightI32[5120 14336]
-
blk.20.ffn_up.weightI32[5120 14336]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weightI32[5120 1024]
-
blk.20.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.20.attn_q.weightI32[5120 4096]
-
blk.20.attn_v.weightQ4_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.21.ffn_gate.weightI32[5120 14336]
-
blk.21.ffn_up.weightI32[5120 14336]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.weightI32[5120 1024]
-
blk.21.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.21.attn_q.weightI32[5120 4096]
-
blk.21.attn_v.weightQ4_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.22.ffn_gate.weightI32[5120 14336]
-
blk.22.ffn_up.weightI32[5120 14336]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weightI32[5120 1024]
-
blk.22.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.22.attn_q.weightI32[5120 4096]
-
blk.22.attn_v.weightQ4_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.23.ffn_gate.weightI32[5120 14336]
-
blk.23.ffn_up.weightI32[5120 14336]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weightI32[5120 1024]
-
blk.23.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.23.attn_q.weightI32[5120 4096]
-
blk.23.attn_v.weightQ4_K[5120 1024]
-
blk.24.ffn_gate.weightI32[5120 14336]
-
blk.24.attn_k.weightI32[5120 1024]
-
blk.24.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.24.attn_q.weightI32[5120 4096]
-
blk.24.attn_v.weightQ4_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.24.ffn_up.weightI32[5120 14336]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.25.ffn_gate.weightI32[5120 14336]
-
blk.25.ffn_up.weightI32[5120 14336]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weightI32[5120 1024]
-
blk.25.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.25.attn_q.weightI32[5120 4096]
-
blk.25.attn_v.weightQ4_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.26.ffn_gate.weightI32[5120 14336]
-
blk.26.ffn_up.weightI32[5120 14336]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weightI32[5120 1024]
-
blk.26.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.26.attn_q.weightI32[5120 4096]
-
blk.26.attn_v.weightQ4_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.27.ffn_gate.weightI32[5120 14336]
-
blk.27.ffn_up.weightI32[5120 14336]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weightI32[5120 1024]
-
blk.27.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.27.attn_q.weightI32[5120 4096]
-
blk.27.attn_v.weightQ4_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.28.ffn_gate.weightI32[5120 14336]
-
blk.28.ffn_up.weightI32[5120 14336]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.weightI32[5120 1024]
-
blk.28.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.28.attn_q.weightI32[5120 4096]
-
blk.28.attn_v.weightQ4_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.29.ffn_gate.weightI32[5120 14336]
-
blk.29.ffn_up.weightI32[5120 14336]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weightI32[5120 1024]
-
blk.29.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.29.attn_q.weightI32[5120 4096]
-
blk.29.attn_v.weightQ4_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.30.ffn_gate.weightI32[5120 14336]
-
blk.30.ffn_up.weightI32[5120 14336]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.weightI32[5120 1024]
-
blk.30.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.30.attn_q.weightI32[5120 4096]
-
blk.30.attn_v.weightQ4_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.31.ffn_gate.weightI32[5120 14336]
-
blk.31.ffn_up.weightI32[5120 14336]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weightI32[5120 1024]
-
blk.31.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.31.attn_q.weightI32[5120 4096]
-
blk.31.attn_v.weightQ4_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.32.ffn_gate.weightI32[5120 14336]
-
blk.32.ffn_up.weightI32[5120 14336]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weightI32[5120 1024]
-
blk.32.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.32.attn_q.weightI32[5120 4096]
-
blk.32.attn_v.weightQ4_K[5120 1024]
-
blk.33.ffn_gate.weightI32[5120 14336]
-
blk.33.attn_k.weightI32[5120 1024]
-
blk.33.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.33.attn_q.weightI32[5120 4096]
-
blk.33.attn_v.weightQ4_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.33.ffn_up.weightI32[5120 14336]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.34.ffn_gate.weightI32[5120 14336]
-
blk.34.ffn_up.weightI32[5120 14336]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weightI32[5120 1024]
-
blk.34.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.34.attn_q.weightI32[5120 4096]
-
blk.34.attn_v.weightQ4_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.35.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.weightI32[5120 1024]
-
blk.35.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.35.attn_q.weightI32[5120 4096]
-
blk.35.attn_v.weightQ4_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.36.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weightI32[5120 1024]
-
blk.36.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.36.attn_q.weightI32[5120 4096]
-
blk.36.attn_v.weightQ4_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.37.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weightI32[5120 1024]
-
blk.37.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.37.attn_q.weightI32[5120 4096]
-
blk.37.attn_v.weightQ4_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.38.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weightI32[5120 1024]
-
blk.38.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.38.attn_q.weightI32[5120 4096]
-
blk.38.attn_v.weightQ4_K[5120 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weight(!unknown_type 21!)[14336 5120]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[5120 14336]
-
blk.39.ffn_up.weight(!unknown_type 21!)[5120 14336]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weightI32[5120 1024]
-
blk.39.attn_output.weight(!unknown_type 21!)[4096 5120]
-
blk.39.attn_q.weightI32[5120 4096]
-
blk.39.attn_v.weightQ4_K[5120 1024]
-
output.weightQ6_K[5120 131072]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39