23 Pulls Updated 4 months ago
a9098e8e89e6 · 7.5GB
-
general.architecturephi3
-
general.file_type30
-
general.namePhi3
-
general.quantization_version2
-
phi3.attention.head_count40
-
phi3.attention.head_count_kv10
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count40
-
phi3.context_length131072
-
phi3.embedding_length5120
-
phi3.feed_forward_length17920
-
phi3.rope.dimension_count128
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.attn_factor1.1902381
-
phi3.rope.scaling.original_context_length4096
-
quantize.imatrix.chunks_count234
-
quantize.imatrix.dataset/training_data/calibration_data.txt
-
quantize.imatrix.entries_count160
-
quantize.imatrix.file/models/Phi-3-medium-128k-instruct-GGUF/Phi-3-medium-128k-instruct.imatrix
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 4, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[5120, 32064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.0.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.0.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.1.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.1.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.2.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.2.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.3.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.3.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.4.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.4.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.5.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.5.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.6.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.6.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.7.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.7.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.8.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.8.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.9.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.9.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.10.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.10.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.11.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.11.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.12.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.12.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.13.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.13.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.14.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.14.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.15.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.15.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.16.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.16.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.17.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.17.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.18.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.18.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.19.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.19.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.20.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.20.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.21.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.21.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.22.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.22.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.23.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.23.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.24.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.24.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.25.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.25.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.26.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.26.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.27.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.27.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.28.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.28.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.29.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.29.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.30.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.30.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.31.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.31.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.32.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.32.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.33.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.33.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.34.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.34.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.35.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.35.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.36.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.36.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.37.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.37.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.38.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.38.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.39.attn_qkv.weight(!unknown_type 23!)[5120, 7680]
-
blk.39.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 23!)[5120, 35840]
-
output.weightQ6_K[5120, 32064]
-
rope_factors_long.weightF32[64]
-
rope_factors_short.weightF32[64]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39