I-quants for mistral-nemo-instruct-2407-abliterated
tools
141 Pulls Updated 8 weeks ago
73e812175108 · 5.7GB
-
general.architecturellama
-
general.basenameMistral
-
general.file_type27
-
general.finetuneInstruct
-
general.languages[en, fr, de, es, it, ...]
-
general.licenseapache-2.0
-
general.nameMistral 7B Instruct v0.1
-
general.organizationMistralai
-
general.quantization_version2
-
general.size_label7B
-
general.source.urlhttps://huggingface.co/natong19/Mistral-Nemo-Instruct-2407-abliterated
-
general.typemodel
-
general.urlhttps://huggingface.co/mradermacher/Mistral-Nemo-Instruct-2407-abliterated-GGUF
-
general.versionv0.1
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count40
-
llama.context_length1024000
-
llama.embedding_length5120
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size131072
-
mradermacher.convert_typehf
-
mradermacher.quantize_version2
-
mradermacher.quantized_at2024-09-02T22:20:26+02:00
-
mradermacher.quantized_bymradermacher
-
mradermacher.quantized_ondb3
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.merges[Ġ Ġ, Ġ t, e r, i n, Ġ ĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id10
-
tokenizer.ggml.pretekken
-
tokenizer.ggml.token_type[3, 3, 3, 3, 3, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, [INST], [/INST], ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120, 131072]
-
blk.0.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weightQ4_K[4096, 5120]
-
blk.0.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.0.attn_v.weightQ4_K[5120, 1024]
-
blk.0.ffn_down.weightQ4_K[14336, 5120]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.1.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ4_K[4096, 5120]
-
blk.1.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.1.attn_v.weightQ4_K[5120, 1024]
-
blk.1.ffn_down.weightQ4_K[14336, 5120]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.2.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ4_K[4096, 5120]
-
blk.2.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.2.attn_v.weightQ4_K[5120, 1024]
-
blk.2.ffn_down.weightQ4_K[14336, 5120]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.3.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ4_K[4096, 5120]
-
blk.3.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.3.attn_v.weightQ4_K[5120, 1024]
-
blk.3.ffn_down.weightQ4_K[14336, 5120]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.4.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ4_K[4096, 5120]
-
blk.4.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.4.attn_v.weightQ4_K[5120, 1024]
-
blk.4.ffn_down.weightQ4_K[14336, 5120]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.5.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ4_K[4096, 5120]
-
blk.5.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.5.attn_v.weightQ4_K[5120, 1024]
-
blk.5.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.6.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weightQ4_K[4096, 5120]
-
blk.6.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.6.attn_v.weightQ4_K[5120, 1024]
-
blk.6.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.7.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ4_K[4096, 5120]
-
blk.7.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.7.attn_v.weightQ4_K[5120, 1024]
-
blk.7.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.8.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ4_K[4096, 5120]
-
blk.8.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.8.attn_v.weightQ4_K[5120, 1024]
-
blk.8.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.9.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ4_K[4096, 5120]
-
blk.9.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.9.attn_v.weightQ4_K[5120, 1024]
-
blk.9.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.10.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ4_K[4096, 5120]
-
blk.10.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.10.attn_v.weightQ4_K[5120, 1024]
-
blk.10.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.11.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ4_K[4096, 5120]
-
blk.11.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.11.attn_v.weightQ4_K[5120, 1024]
-
blk.11.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.12.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ4_K[4096, 5120]
-
blk.12.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.12.attn_v.weightQ4_K[5120, 1024]
-
blk.12.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.13.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ4_K[4096, 5120]
-
blk.13.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.13.attn_v.weightQ4_K[5120, 1024]
-
blk.13.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.14.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ4_K[4096, 5120]
-
blk.14.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.14.attn_v.weightQ4_K[5120, 1024]
-
blk.14.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.14.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.15.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ4_K[4096, 5120]
-
blk.15.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.15.attn_v.weightQ4_K[5120, 1024]
-
blk.15.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.15.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.16.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ4_K[4096, 5120]
-
blk.16.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.16.attn_v.weightQ4_K[5120, 1024]
-
blk.16.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.16.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.17.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ4_K[4096, 5120]
-
blk.17.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.17.attn_v.weightQ4_K[5120, 1024]
-
blk.17.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.17.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.18.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ4_K[4096, 5120]
-
blk.18.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.18.attn_v.weightQ4_K[5120, 1024]
-
blk.18.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.18.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.19.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ4_K[4096, 5120]
-
blk.19.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.19.attn_v.weightQ4_K[5120, 1024]
-
blk.19.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.19.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.20.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ4_K[4096, 5120]
-
blk.20.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.20.attn_v.weightQ4_K[5120, 1024]
-
blk.20.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.20.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.21.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weightQ4_K[4096, 5120]
-
blk.21.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.21.attn_v.weightQ4_K[5120, 1024]
-
blk.21.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.21.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.22.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ4_K[4096, 5120]
-
blk.22.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.22.attn_v.weightQ4_K[5120, 1024]
-
blk.22.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.22.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.23.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ4_K[4096, 5120]
-
blk.23.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.23.attn_v.weightQ4_K[5120, 1024]
-
blk.23.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.23.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.24.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ4_K[4096, 5120]
-
blk.24.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.24.attn_v.weightQ4_K[5120, 1024]
-
blk.24.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.24.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.25.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ4_K[4096, 5120]
-
blk.25.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.25.attn_v.weightQ4_K[5120, 1024]
-
blk.25.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.25.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.26.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ4_K[4096, 5120]
-
blk.26.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.26.attn_v.weightQ4_K[5120, 1024]
-
blk.26.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.26.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.27.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ4_K[4096, 5120]
-
blk.27.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.27.attn_v.weightQ4_K[5120, 1024]
-
blk.27.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.27.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.28.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weightQ4_K[4096, 5120]
-
blk.28.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.28.attn_v.weightQ4_K[5120, 1024]
-
blk.28.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.28.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.29.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ4_K[4096, 5120]
-
blk.29.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.29.attn_v.weightQ4_K[5120, 1024]
-
blk.29.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.29.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.30.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ4_K[4096, 5120]
-
blk.30.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.30.attn_v.weightQ4_K[5120, 1024]
-
blk.30.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.30.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.31.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ4_K[4096, 5120]
-
blk.31.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.31.attn_v.weightQ4_K[5120, 1024]
-
blk.31.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.31.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.32.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ4_K[4096, 5120]
-
blk.32.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.32.attn_v.weightQ4_K[5120, 1024]
-
blk.32.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.32.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.33.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ4_K[4096, 5120]
-
blk.33.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.33.attn_v.weightQ4_K[5120, 1024]
-
blk.33.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.33.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.34.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ4_K[4096, 5120]
-
blk.34.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.34.attn_v.weightQ4_K[5120, 1024]
-
blk.34.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.34.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.35.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weightQ4_K[4096, 5120]
-
blk.35.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.35.attn_v.weightQ4_K[5120, 1024]
-
blk.35.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.36.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ4_K[4096, 5120]
-
blk.36.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.36.attn_v.weightQ4_K[5120, 1024]
-
blk.36.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.37.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ4_K[4096, 5120]
-
blk.37.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.37.attn_v.weightQ4_K[5120, 1024]
-
blk.37.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.38.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ4_K[4096, 5120]
-
blk.38.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.38.attn_v.weightQ4_K[5120, 1024]
-
blk.38.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
blk.39.attn_k.weight(!unknown_type 21!)[5120, 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ4_K[4096, 5120]
-
blk.39.attn_q.weight(!unknown_type 21!)[5120, 4096]
-
blk.39.attn_v.weightQ4_K[5120, 1024]
-
blk.39.ffn_down.weight(!unknown_type 21!)[14336, 5120]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[5120, 14336]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 21!)[5120, 14336]
-
output.weightQ6_K[5120, 131072]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39