thanks to bartowski for quants on HF
143 Pulls Updated 5 months ago
b869266dcc0f · 6.3GB
-
general.architecturellama
-
general.file_type27
-
general.namedolphin-2.9.2-Phi-3-Medium
-
general.quantization_version2
-
llama.attention.head_count40
-
llama.attention.head_count_kv10
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count40
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length17920
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
quantize.imatrix.chunks_count151
-
quantize.imatrix.dataset/training_data/calibration_datav3.txt
-
quantize.imatrix.entries_count280
-
quantize.imatrix.file/models/dolphin-2.9.2-Phi-3-Medium-GGUF/dolphin-2.9.2-Phi-3-Medium.imatrix
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32011
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32009
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type[2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120, 32064]
-
blk.0.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weightQ4_K[5120, 5120]
-
blk.0.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.0.attn_v.weightQ4_K[5120, 1280]
-
blk.0.ffn_down.weightQ4_K[17920, 5120]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.1.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ4_K[5120, 5120]
-
blk.1.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.1.attn_v.weightQ4_K[5120, 1280]
-
blk.1.ffn_down.weightQ4_K[17920, 5120]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.2.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ4_K[5120, 5120]
-
blk.2.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.2.attn_v.weightQ4_K[5120, 1280]
-
blk.2.ffn_down.weightQ4_K[17920, 5120]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.3.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ4_K[5120, 5120]
-
blk.3.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.3.attn_v.weightQ4_K[5120, 1280]
-
blk.3.ffn_down.weightQ4_K[17920, 5120]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.4.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ4_K[5120, 5120]
-
blk.4.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.4.attn_v.weightQ4_K[5120, 1280]
-
blk.4.ffn_down.weightQ4_K[17920, 5120]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.5.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ4_K[5120, 5120]
-
blk.5.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.5.attn_v.weightQ4_K[5120, 1280]
-
blk.5.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.6.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weightQ4_K[5120, 5120]
-
blk.6.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.6.attn_v.weightQ4_K[5120, 1280]
-
blk.6.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.7.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ4_K[5120, 5120]
-
blk.7.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.7.attn_v.weightQ4_K[5120, 1280]
-
blk.7.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.8.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ4_K[5120, 5120]
-
blk.8.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.8.attn_v.weightQ4_K[5120, 1280]
-
blk.8.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.9.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ4_K[5120, 5120]
-
blk.9.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.9.attn_v.weightQ4_K[5120, 1280]
-
blk.9.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.10.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ4_K[5120, 5120]
-
blk.10.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.10.attn_v.weightQ4_K[5120, 1280]
-
blk.10.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.11.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ4_K[5120, 5120]
-
blk.11.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.11.attn_v.weightQ4_K[5120, 1280]
-
blk.11.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.12.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ4_K[5120, 5120]
-
blk.12.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.12.attn_v.weightQ4_K[5120, 1280]
-
blk.12.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.13.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ4_K[5120, 5120]
-
blk.13.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.13.attn_v.weightQ4_K[5120, 1280]
-
blk.13.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.14.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ4_K[5120, 5120]
-
blk.14.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.14.attn_v.weightQ4_K[5120, 1280]
-
blk.14.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.14.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.15.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ4_K[5120, 5120]
-
blk.15.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.15.attn_v.weightQ4_K[5120, 1280]
-
blk.15.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.15.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.16.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ4_K[5120, 5120]
-
blk.16.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.16.attn_v.weightQ4_K[5120, 1280]
-
blk.16.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.16.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.17.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ4_K[5120, 5120]
-
blk.17.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.17.attn_v.weightQ4_K[5120, 1280]
-
blk.17.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.17.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.18.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ4_K[5120, 5120]
-
blk.18.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.18.attn_v.weightQ4_K[5120, 1280]
-
blk.18.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.18.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.19.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ4_K[5120, 5120]
-
blk.19.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.19.attn_v.weightQ4_K[5120, 1280]
-
blk.19.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.19.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.20.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ4_K[5120, 5120]
-
blk.20.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.20.attn_v.weightQ4_K[5120, 1280]
-
blk.20.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.20.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.21.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weightQ4_K[5120, 5120]
-
blk.21.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.21.attn_v.weightQ4_K[5120, 1280]
-
blk.21.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.21.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.22.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ4_K[5120, 5120]
-
blk.22.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.22.attn_v.weightQ4_K[5120, 1280]
-
blk.22.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.22.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.23.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ4_K[5120, 5120]
-
blk.23.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.23.attn_v.weightQ4_K[5120, 1280]
-
blk.23.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.23.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.24.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ4_K[5120, 5120]
-
blk.24.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.24.attn_v.weightQ4_K[5120, 1280]
-
blk.24.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.24.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.25.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ4_K[5120, 5120]
-
blk.25.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.25.attn_v.weightQ4_K[5120, 1280]
-
blk.25.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.25.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.26.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ4_K[5120, 5120]
-
blk.26.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.26.attn_v.weightQ4_K[5120, 1280]
-
blk.26.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.26.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.27.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ4_K[5120, 5120]
-
blk.27.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.27.attn_v.weightQ4_K[5120, 1280]
-
blk.27.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.27.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.28.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weightQ4_K[5120, 5120]
-
blk.28.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.28.attn_v.weightQ4_K[5120, 1280]
-
blk.28.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.28.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.29.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ4_K[5120, 5120]
-
blk.29.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.29.attn_v.weightQ4_K[5120, 1280]
-
blk.29.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.29.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.30.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ4_K[5120, 5120]
-
blk.30.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.30.attn_v.weightQ4_K[5120, 1280]
-
blk.30.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.30.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.31.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ4_K[5120, 5120]
-
blk.31.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.31.attn_v.weightQ4_K[5120, 1280]
-
blk.31.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.31.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.32.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ4_K[5120, 5120]
-
blk.32.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.32.attn_v.weightQ4_K[5120, 1280]
-
blk.32.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.32.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.33.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ4_K[5120, 5120]
-
blk.33.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.33.attn_v.weightQ4_K[5120, 1280]
-
blk.33.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.33.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.34.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ4_K[5120, 5120]
-
blk.34.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.34.attn_v.weightQ4_K[5120, 1280]
-
blk.34.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.34.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.35.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weightQ4_K[5120, 5120]
-
blk.35.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.35.attn_v.weightQ4_K[5120, 1280]
-
blk.35.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.36.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ4_K[5120, 5120]
-
blk.36.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.36.attn_v.weightQ4_K[5120, 1280]
-
blk.36.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.37.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ4_K[5120, 5120]
-
blk.37.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.37.attn_v.weightQ4_K[5120, 1280]
-
blk.37.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.38.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ4_K[5120, 5120]
-
blk.38.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.38.attn_v.weightQ4_K[5120, 1280]
-
blk.38.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.39.attn_k.weight(!unknown_type 21!)[5120, 1280]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ4_K[5120, 5120]
-
blk.39.attn_q.weight(!unknown_type 21!)[5120, 5120]
-
blk.39.attn_v.weightQ4_K[5120, 1280]
-
blk.39.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
output.weightQ6_K[5120, 32064]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39