thanks to bartowski for quants on HF
140 Pulls Updated 5 months ago
6691588c1e19 · 4.8GB
-
general.architecturellama
-
general.file_type29
-
general.namedolphin-2.9.2-Phi-3-Medium
-
general.quantization_version2
-
llama.attention.head_count40
-
llama.attention.head_count_kv10
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count40
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length17920
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
quantize.imatrix.chunks_count151
-
quantize.imatrix.dataset/training_data/calibration_datav3.txt
-
quantize.imatrix.entries_count280
-
quantize.imatrix.file/models/dolphin-2.9.2-Phi-3-Medium-GGUF/dolphin-2.9.2-Phi-3-Medium.imatrix
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32011
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32009
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type[2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120, 32064]
-
blk.0.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.0.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.0.attn_v.weightQ4_K[5120, 1280]
-
blk.0.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.0.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.1.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.1.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.1.attn_v.weightQ4_K[5120, 1280]
-
blk.1.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.1.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.2.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.2.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.2.attn_v.weightQ4_K[5120, 1280]
-
blk.2.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.2.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.3.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.3.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.3.attn_v.weightQ4_K[5120, 1280]
-
blk.3.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.3.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.4.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.4.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.4.attn_v.weightQ4_K[5120, 1280]
-
blk.4.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.4.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.5.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.5.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.5.attn_v.weightQ4_K[5120, 1280]
-
blk.5.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.5.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.6.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.6.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.6.attn_v.weightQ4_K[5120, 1280]
-
blk.6.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.6.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.7.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.7.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.7.attn_v.weightQ4_K[5120, 1280]
-
blk.7.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.7.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.8.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.8.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.8.attn_v.weightQ4_K[5120, 1280]
-
blk.8.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.8.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.9.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.9.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.9.attn_v.weightQ4_K[5120, 1280]
-
blk.9.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.9.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.10.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.10.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.10.attn_v.weightQ4_K[5120, 1280]
-
blk.10.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.10.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.11.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.11.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.11.attn_v.weightQ4_K[5120, 1280]
-
blk.11.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.11.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.12.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.12.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.12.attn_v.weightQ4_K[5120, 1280]
-
blk.12.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.12.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.13.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.13.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.13.attn_v.weightQ4_K[5120, 1280]
-
blk.13.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.13.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.14.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.14.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.14.attn_v.weightQ4_K[5120, 1280]
-
blk.14.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.14.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.15.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.15.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.15.attn_v.weightQ4_K[5120, 1280]
-
blk.15.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.15.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.16.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.16.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.16.attn_v.weightQ4_K[5120, 1280]
-
blk.16.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.16.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.17.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.17.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.17.attn_v.weightQ4_K[5120, 1280]
-
blk.17.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.17.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.18.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.18.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.18.attn_v.weightQ4_K[5120, 1280]
-
blk.18.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.18.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.19.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.19.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.19.attn_v.weightQ4_K[5120, 1280]
-
blk.19.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.19.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.20.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.20.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.20.attn_v.weightQ4_K[5120, 1280]
-
blk.20.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.20.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.21.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.21.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.21.attn_v.weightQ4_K[5120, 1280]
-
blk.21.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.21.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.22.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.22.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.22.attn_v.weightQ4_K[5120, 1280]
-
blk.22.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.22.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.23.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.23.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.23.attn_v.weightQ4_K[5120, 1280]
-
blk.23.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.23.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.24.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.24.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.24.attn_v.weightQ4_K[5120, 1280]
-
blk.24.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.24.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.25.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.25.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.25.attn_v.weightQ4_K[5120, 1280]
-
blk.25.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.25.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.26.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.26.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.26.attn_v.weightQ4_K[5120, 1280]
-
blk.26.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.26.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.27.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.27.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.27.attn_v.weightQ4_K[5120, 1280]
-
blk.27.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.27.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.28.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.28.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.28.attn_v.weightQ4_K[5120, 1280]
-
blk.28.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.28.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.29.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.29.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.29.attn_v.weightQ4_K[5120, 1280]
-
blk.29.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.29.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.30.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.30.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.30.attn_v.weightQ4_K[5120, 1280]
-
blk.30.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.30.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.31.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.31.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.31.attn_v.weightQ4_K[5120, 1280]
-
blk.31.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.31.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.32.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.32.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.32.attn_v.weightQ4_K[5120, 1280]
-
blk.32.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.32.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.33.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.33.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.33.attn_v.weightQ4_K[5120, 1280]
-
blk.33.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.33.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.34.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.34.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.34.attn_v.weightQ4_K[5120, 1280]
-
blk.34.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.34.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.35.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.35.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.35.attn_v.weightQ4_K[5120, 1280]
-
blk.35.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.35.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.36.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.36.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.36.attn_v.weightQ4_K[5120, 1280]
-
blk.36.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.36.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.37.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.37.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.37.attn_v.weightQ4_K[5120, 1280]
-
blk.37.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.37.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.38.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.38.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.38.attn_v.weightQ4_K[5120, 1280]
-
blk.38.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.38.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
blk.39.attn_k.weight(!unknown_type 22!)[5120, 1280]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.39.attn_q.weight(!unknown_type 22!)[5120, 5120]
-
blk.39.attn_v.weightQ4_K[5120, 1280]
-
blk.39.ffn_down.weight(!unknown_type 22!)[17920, 5120]
-
blk.39.ffn_gate.weight(!unknown_type 22!)[5120, 17920]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 22!)[5120, 17920]
-
output.weightQ5_K[5120, 32064]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39