thanks to bartowski for quants on HF
140 Pulls Updated 5 months ago
35c1dc281377 · 5.8GB
-
general.architecturellama
-
general.file_type22
-
general.namedolphin-2.9.2-Phi-3-Medium
-
general.quantization_version2
-
llama.attention.head_count40
-
llama.attention.head_count_kv10
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count40
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length17920
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
quantize.imatrix.chunks_count151
-
quantize.imatrix.dataset/training_data/calibration_datav3.txt
-
quantize.imatrix.entries_count280
-
quantize.imatrix.file/models/dolphin-2.9.2-Phi-3-Medium-GGUF/dolphin-2.9.2-Phi-3-Medium.imatrix
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32011
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32009
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type[2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[5120, 32064]
-
blk.0.attn_k.weightI32[5120, 1280]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.0.attn_q.weightI32[5120, 5120]
-
blk.0.attn_v.weightQ4_K[5120, 1280]
-
blk.0.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.1.attn_k.weightI32[5120, 1280]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.1.attn_q.weightI32[5120, 5120]
-
blk.1.attn_v.weightQ4_K[5120, 1280]
-
blk.1.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.2.attn_k.weightI32[5120, 1280]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.2.attn_q.weightI32[5120, 5120]
-
blk.2.attn_v.weightQ4_K[5120, 1280]
-
blk.2.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.3.attn_k.weightI32[5120, 1280]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.3.attn_q.weightI32[5120, 5120]
-
blk.3.attn_v.weightQ4_K[5120, 1280]
-
blk.3.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.4.attn_k.weightI32[5120, 1280]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.4.attn_q.weightI32[5120, 5120]
-
blk.4.attn_v.weightQ4_K[5120, 1280]
-
blk.4.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.5.attn_k.weightI32[5120, 1280]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.5.attn_q.weightI32[5120, 5120]
-
blk.5.attn_v.weightQ4_K[5120, 1280]
-
blk.5.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.5.ffn_gate.weightI32[5120, 17920]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weightI32[5120, 17920]
-
blk.6.attn_k.weightI32[5120, 1280]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.6.attn_q.weightI32[5120, 5120]
-
blk.6.attn_v.weightQ4_K[5120, 1280]
-
blk.6.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.6.ffn_gate.weightI32[5120, 17920]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weightI32[5120, 17920]
-
blk.7.attn_k.weightI32[5120, 1280]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.7.attn_q.weightI32[5120, 5120]
-
blk.7.attn_v.weightQ4_K[5120, 1280]
-
blk.7.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.7.ffn_gate.weightI32[5120, 17920]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weightI32[5120, 17920]
-
blk.8.attn_k.weightI32[5120, 1280]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.8.attn_q.weightI32[5120, 5120]
-
blk.8.attn_v.weightQ4_K[5120, 1280]
-
blk.8.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.8.ffn_gate.weightI32[5120, 17920]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weightI32[5120, 17920]
-
blk.9.attn_k.weightI32[5120, 1280]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.9.attn_q.weightI32[5120, 5120]
-
blk.9.attn_v.weightQ4_K[5120, 1280]
-
blk.9.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.9.ffn_gate.weightI32[5120, 17920]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weightI32[5120, 17920]
-
blk.10.attn_k.weightI32[5120, 1280]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.10.attn_q.weightI32[5120, 5120]
-
blk.10.attn_v.weightQ4_K[5120, 1280]
-
blk.10.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.10.ffn_gate.weightI32[5120, 17920]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weightI32[5120, 17920]
-
blk.11.attn_k.weightI32[5120, 1280]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.11.attn_q.weightI32[5120, 5120]
-
blk.11.attn_v.weightQ4_K[5120, 1280]
-
blk.11.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.11.ffn_gate.weightI32[5120, 17920]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weightI32[5120, 17920]
-
blk.12.attn_k.weightI32[5120, 1280]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.12.attn_q.weightI32[5120, 5120]
-
blk.12.attn_v.weightQ4_K[5120, 1280]
-
blk.12.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.12.ffn_gate.weightI32[5120, 17920]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weightI32[5120, 17920]
-
blk.13.attn_k.weightI32[5120, 1280]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.13.attn_q.weightI32[5120, 5120]
-
blk.13.attn_v.weightQ4_K[5120, 1280]
-
blk.13.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.13.ffn_gate.weightI32[5120, 17920]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weightI32[5120, 17920]
-
blk.14.attn_k.weightI32[5120, 1280]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.14.attn_q.weightI32[5120, 5120]
-
blk.14.attn_v.weightQ4_K[5120, 1280]
-
blk.14.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.14.ffn_gate.weightI32[5120, 17920]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weightI32[5120, 17920]
-
blk.15.attn_k.weightI32[5120, 1280]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.15.attn_q.weightI32[5120, 5120]
-
blk.15.attn_v.weightQ4_K[5120, 1280]
-
blk.15.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.15.ffn_gate.weightI32[5120, 17920]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weightI32[5120, 17920]
-
blk.16.attn_k.weightI32[5120, 1280]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.16.attn_q.weightI32[5120, 5120]
-
blk.16.attn_v.weightQ4_K[5120, 1280]
-
blk.16.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.16.ffn_gate.weightI32[5120, 17920]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weightI32[5120, 17920]
-
blk.17.attn_k.weightI32[5120, 1280]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.17.attn_q.weightI32[5120, 5120]
-
blk.17.attn_v.weightQ4_K[5120, 1280]
-
blk.17.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.17.ffn_gate.weightI32[5120, 17920]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weightI32[5120, 17920]
-
blk.18.attn_k.weightI32[5120, 1280]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.18.attn_q.weightI32[5120, 5120]
-
blk.18.attn_v.weightQ4_K[5120, 1280]
-
blk.18.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.18.ffn_gate.weightI32[5120, 17920]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weightI32[5120, 17920]
-
blk.19.attn_k.weightI32[5120, 1280]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.19.attn_q.weightI32[5120, 5120]
-
blk.19.attn_v.weightQ4_K[5120, 1280]
-
blk.19.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.19.ffn_gate.weightI32[5120, 17920]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weightI32[5120, 17920]
-
blk.20.attn_k.weightI32[5120, 1280]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.20.attn_q.weightI32[5120, 5120]
-
blk.20.attn_v.weightQ4_K[5120, 1280]
-
blk.20.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.20.ffn_gate.weightI32[5120, 17920]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weightI32[5120, 17920]
-
blk.21.attn_k.weightI32[5120, 1280]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.21.attn_q.weightI32[5120, 5120]
-
blk.21.attn_v.weightQ4_K[5120, 1280]
-
blk.21.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.21.ffn_gate.weightI32[5120, 17920]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weightI32[5120, 17920]
-
blk.22.attn_k.weightI32[5120, 1280]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.22.attn_q.weightI32[5120, 5120]
-
blk.22.attn_v.weightQ4_K[5120, 1280]
-
blk.22.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.22.ffn_gate.weightI32[5120, 17920]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weightI32[5120, 17920]
-
blk.23.attn_k.weightI32[5120, 1280]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.23.attn_q.weightI32[5120, 5120]
-
blk.23.attn_v.weightQ4_K[5120, 1280]
-
blk.23.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.23.ffn_gate.weightI32[5120, 17920]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weightI32[5120, 17920]
-
blk.24.attn_k.weightI32[5120, 1280]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.24.attn_q.weightI32[5120, 5120]
-
blk.24.attn_v.weightQ4_K[5120, 1280]
-
blk.24.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.24.ffn_gate.weightI32[5120, 17920]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weightI32[5120, 17920]
-
blk.25.attn_k.weightI32[5120, 1280]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.25.attn_q.weightI32[5120, 5120]
-
blk.25.attn_v.weightQ4_K[5120, 1280]
-
blk.25.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.25.ffn_gate.weightI32[5120, 17920]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weightI32[5120, 17920]
-
blk.26.attn_k.weightI32[5120, 1280]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.26.attn_q.weightI32[5120, 5120]
-
blk.26.attn_v.weightQ4_K[5120, 1280]
-
blk.26.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.26.ffn_gate.weightI32[5120, 17920]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weightI32[5120, 17920]
-
blk.27.attn_k.weightI32[5120, 1280]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.27.attn_q.weightI32[5120, 5120]
-
blk.27.attn_v.weightQ4_K[5120, 1280]
-
blk.27.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.27.ffn_gate.weightI32[5120, 17920]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weightI32[5120, 17920]
-
blk.28.attn_k.weightI32[5120, 1280]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.28.attn_q.weightI32[5120, 5120]
-
blk.28.attn_v.weightQ4_K[5120, 1280]
-
blk.28.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.28.ffn_gate.weightI32[5120, 17920]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weightI32[5120, 17920]
-
blk.29.attn_k.weightI32[5120, 1280]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.29.attn_q.weightI32[5120, 5120]
-
blk.29.attn_v.weightQ4_K[5120, 1280]
-
blk.29.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.29.ffn_gate.weightI32[5120, 17920]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weightI32[5120, 17920]
-
blk.30.attn_k.weightI32[5120, 1280]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.30.attn_q.weightI32[5120, 5120]
-
blk.30.attn_v.weightQ4_K[5120, 1280]
-
blk.30.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.30.ffn_gate.weightI32[5120, 17920]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weightI32[5120, 17920]
-
blk.31.attn_k.weightI32[5120, 1280]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.31.attn_q.weightI32[5120, 5120]
-
blk.31.attn_v.weightQ4_K[5120, 1280]
-
blk.31.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.31.ffn_gate.weightI32[5120, 17920]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weightI32[5120, 17920]
-
blk.32.attn_k.weightI32[5120, 1280]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.32.attn_q.weightI32[5120, 5120]
-
blk.32.attn_v.weightQ4_K[5120, 1280]
-
blk.32.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.32.ffn_gate.weightI32[5120, 17920]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weightI32[5120, 17920]
-
blk.33.attn_k.weightI32[5120, 1280]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.33.attn_q.weightI32[5120, 5120]
-
blk.33.attn_v.weightQ4_K[5120, 1280]
-
blk.33.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.33.ffn_gate.weightI32[5120, 17920]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weightI32[5120, 17920]
-
blk.34.attn_k.weightI32[5120, 1280]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.34.attn_q.weightI32[5120, 5120]
-
blk.34.attn_v.weightQ4_K[5120, 1280]
-
blk.34.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.34.ffn_gate.weightI32[5120, 17920]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weightI32[5120, 17920]
-
blk.35.attn_k.weightI32[5120, 1280]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.35.attn_q.weightI32[5120, 5120]
-
blk.35.attn_v.weightQ4_K[5120, 1280]
-
blk.35.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.35.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.36.attn_k.weightI32[5120, 1280]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.36.attn_q.weightI32[5120, 5120]
-
blk.36.attn_v.weightQ4_K[5120, 1280]
-
blk.36.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.36.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.37.attn_k.weightI32[5120, 1280]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.37.attn_q.weightI32[5120, 5120]
-
blk.37.attn_v.weightQ4_K[5120, 1280]
-
blk.37.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.37.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.38.attn_k.weightI32[5120, 1280]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.38.attn_q.weightI32[5120, 5120]
-
blk.38.attn_v.weightQ4_K[5120, 1280]
-
blk.38.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.38.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
blk.39.attn_k.weightI32[5120, 1280]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weight(!unknown_type 21!)[5120, 5120]
-
blk.39.attn_q.weightI32[5120, 5120]
-
blk.39.attn_v.weightQ4_K[5120, 1280]
-
blk.39.ffn_down.weight(!unknown_type 21!)[17920, 5120]
-
blk.39.ffn_gate.weight(!unknown_type 21!)[5120, 17920]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 21!)[5120, 17920]
-
output.weightQ6_K[5120, 32064]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39