I-quants for mistral-nemo-instruct-2407-abliterated
tools
141 Pulls Updated 8 weeks ago
0b147cb93224 · 6.8GB
-
general.architecturellama
-
general.basenameMistral
-
general.file_type30
-
general.finetuneInstruct
-
general.languages[en, fr, de, es, it, ...]
-
general.licenseapache-2.0
-
general.nameMistral 7B Instruct v0.1
-
general.organizationMistralai
-
general.quantization_version2
-
general.size_label7B
-
general.source.urlhttps://huggingface.co/natong19/Mistral-Nemo-Instruct-2407-abliterated
-
general.typemodel
-
general.urlhttps://huggingface.co/mradermacher/Mistral-Nemo-Instruct-2407-abliterated-GGUF
-
general.versionv0.1
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count40
-
llama.context_length1024000
-
llama.embedding_length5120
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size131072
-
mradermacher.convert_typehf
-
mradermacher.quantize_version2
-
mradermacher.quantized_at2024-09-02T22:41:38+02:00
-
mradermacher.quantized_bymradermacher
-
mradermacher.quantized_ondb3
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.merges[Ġ Ġ, Ġ t, e r, i n, Ġ ĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id10
-
tokenizer.ggml.pretekken
-
tokenizer.ggml.token_type[3, 3, 3, 3, 3, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, [INST], [/INST], ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[5120, 131072]
-
blk.0.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.0.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.0.attn_v.weightQ5_K[5120, 1024]
-
blk.0.ffn_down.weightQ5_K[14336, 5120]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.1.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.1.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.1.attn_v.weightQ5_K[5120, 1024]
-
blk.1.ffn_down.weightQ5_K[14336, 5120]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.2.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.2.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.2.attn_v.weightQ5_K[5120, 1024]
-
blk.2.ffn_down.weightQ5_K[14336, 5120]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.3.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.3.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.3.attn_v.weightQ5_K[5120, 1024]
-
blk.3.ffn_down.weightQ5_K[14336, 5120]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.4.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.4.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.4.attn_v.weightQ5_K[5120, 1024]
-
blk.4.ffn_down.weightQ5_K[14336, 5120]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.5.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.5.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.5.attn_v.weightQ5_K[5120, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.6.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.6.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.6.attn_v.weightQ5_K[5120, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.7.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.7.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.7.attn_v.weightQ5_K[5120, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.8.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.8.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.8.attn_v.weightQ5_K[5120, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.9.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.9.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.9.attn_v.weightQ5_K[5120, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.10.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.10.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.10.attn_v.weightQ5_K[5120, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.11.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.11.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.11.attn_v.weightQ5_K[5120, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.12.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.12.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.12.attn_v.weightQ5_K[5120, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.13.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.13.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.13.attn_v.weightQ5_K[5120, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.14.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.14.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.14.attn_v.weightQ5_K[5120, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.15.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.15.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.15.attn_v.weightQ5_K[5120, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.16.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.16.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.16.attn_v.weightQ5_K[5120, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.17.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.17.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.17.attn_v.weightQ5_K[5120, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.18.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.18.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.18.attn_v.weightQ5_K[5120, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.19.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.19.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.19.attn_v.weightQ5_K[5120, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.20.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.20.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.20.attn_v.weightQ5_K[5120, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.21.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.21.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.21.attn_v.weightQ5_K[5120, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.22.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.22.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.22.attn_v.weightQ5_K[5120, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.23.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.23.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.23.attn_v.weightQ5_K[5120, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.24.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.24.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.24.attn_v.weightQ5_K[5120, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.25.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.25.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.25.attn_v.weightQ5_K[5120, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.26.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.26.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.26.attn_v.weightQ5_K[5120, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.27.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.27.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.27.attn_v.weightQ5_K[5120, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.28.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.28.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.28.attn_v.weightQ5_K[5120, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.29.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.29.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.29.attn_v.weightQ5_K[5120, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.30.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.30.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.30.attn_v.weightQ5_K[5120, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.31.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.31.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.31.attn_v.weightQ5_K[5120, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.32.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.32.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.32.attn_v.weightQ5_K[5120, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.33.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.33.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.33.attn_v.weightQ5_K[5120, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.34.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.34.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.34.attn_v.weightQ5_K[5120, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.35.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.35.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.35.attn_v.weightQ5_K[5120, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.36.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.36.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.36.attn_v.weightQ5_K[5120, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.37.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.37.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.37.attn_v.weightQ5_K[5120, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.38.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.38.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.38.attn_v.weightQ5_K[5120, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
blk.39.attn_k.weight(!unknown_type 23!)[5120, 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weight(!unknown_type 23!)[4096, 5120]
-
blk.39.attn_q.weight(!unknown_type 23!)[5120, 4096]
-
blk.39.attn_v.weightQ5_K[5120, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[14336, 5120]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[5120, 14336]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 23!)[5120, 14336]
-
output.weightQ6_K[5120, 131072]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39