I-quants for mistral-nemo-instruct-2407-abliterated
Tools
12B
4 Pulls Updated 3 days ago
0b147cb93224 · 6.8GB
-
mradermacher.convert_typehf
-
mradermacher.quantize_version2
-
mradermacher.quantized_at2024-09-02T22:41:38+02:00
-
mradermacher.quantized_bymradermacher
-
mradermacher.quantized_ondb3
-
general.architecturellama
-
general.file_typeIQ1_M
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count40
-
llama.context_length1024000
-
llama.embedding_length5120
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size131072
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.merges[Ġ Ġ Ġ t e r i n Ġ ĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id10
-
tokenizer.ggml.pretekken
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[5120 131072]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ5_K[14336 5120]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.0.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.0.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.0.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.0.attn_v.weightQ5_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ5_K[14336 5120]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.1.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.1.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.1.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.1.attn_v.weightQ5_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ5_K[14336 5120]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.2.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.2.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.2.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.2.attn_v.weightQ5_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ5_K[14336 5120]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.3.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.3.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.3.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.3.attn_v.weightQ5_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ5_K[14336 5120]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.4.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.4.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.4.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.4.attn_v.weightQ5_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.5.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.5.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.5.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.5.attn_v.weightQ5_K[5120 1024]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.6.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.6.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.6.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.6.attn_v.weightQ5_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.6.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.7.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.7.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.7.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.7.attn_v.weightQ5_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.8.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.8.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.8.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.8.attn_v.weightQ5_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.9.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.9.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.9.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.9.attn_v.weightQ5_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.10.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.10.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.10.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.10.attn_v.weightQ5_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.11.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.11.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.11.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.11.attn_v.weightQ5_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.12.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.12.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.12.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.12.attn_v.weightQ5_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.13.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.13.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.13.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.13.attn_v.weightQ5_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.14.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.14.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.14.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.14.attn_v.weightQ5_K[5120 1024]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.15.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.15.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.15.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.15.attn_v.weightQ5_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.15.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.16.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.16.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.16.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.16.attn_v.weightQ5_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.17.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.17.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.17.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.17.attn_v.weightQ5_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.18.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.18.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.18.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.18.attn_v.weightQ5_K[5120 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.19.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.19.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.19.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.19.attn_v.weightQ5_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.20.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.20.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.20.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.20.attn_v.weightQ5_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.21.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.21.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.21.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.21.attn_v.weightQ5_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.22.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.22.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.22.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.22.attn_v.weightQ5_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.23.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.23.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.23.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.23.attn_v.weightQ5_K[5120 1024]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.24.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.24.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.24.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.24.attn_v.weightQ5_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.24.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.25.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.25.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.25.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.25.attn_v.weightQ5_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.26.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.26.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.26.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.26.attn_v.weightQ5_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.27.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.27.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.27.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.27.attn_v.weightQ5_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.28.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.28.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.28.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.28.attn_v.weightQ5_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.29.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.29.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.29.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.29.attn_v.weightQ5_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.30.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.30.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.30.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.30.attn_v.weightQ5_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.31.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.31.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.31.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.31.attn_v.weightQ5_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.32.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.32.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.32.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.32.attn_v.weightQ5_K[5120 1024]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.33.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.33.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.33.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.33.attn_v.weightQ5_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.33.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.34.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.34.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.34.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.34.attn_v.weightQ5_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.35.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.35.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.35.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.35.attn_v.weightQ5_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.36.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.36.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.36.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.36.attn_v.weightQ5_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.37.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.37.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.37.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.37.attn_v.weightQ5_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.38.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.38.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.38.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.38.attn_v.weightQ5_K[5120 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weight(!unknown_type 23!)[14336 5120]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[5120 14336]
-
blk.39.ffn_up.weight(!unknown_type 23!)[5120 14336]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weight(!unknown_type 23!)[5120 1024]
-
blk.39.attn_output.weight(!unknown_type 23!)[4096 5120]
-
blk.39.attn_q.weight(!unknown_type 23!)[5120 4096]
-
blk.39.attn_v.weightQ5_K[5120 1024]
-
output.weightQ6_K[5120 131072]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39