bartowski/Phi-3-medium-128k-instruct-GGUF
14B
175 Pulls Updated 4 months ago
d8ed734336b8 · 8.6GB
-
quantize.imatrix.chunks_count234
-
quantize.imatrix.dataset/training_data/calibration_data.txt
-
quantize.imatrix.entries_count160
-
quantize.imatrix.file/models/Phi-3-medium-128k-instruct-GGUF/Phi-3-medium-128k-instruct.imatrix
-
general.architecturephi3
-
general.file_typeQ4_K_M
-
phi3.attention.head_count40
-
phi3.attention.head_count_kv10
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count40
-
phi3.context_length131072
-
phi3.embedding_length5120
-
phi3.feed_forward_length17920
-
phi3.rope.dimension_count128
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.attn_factor1.1902381
-
phi3.rope.scaling.original_context_length4096
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 4 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[5120 32064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ6_K[17920 5120]
-
blk.0.ffn_up.weightQ4_K[5120 35840]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_output.weightQ4_K[5120 5120]
-
blk.0.attn_qkv.weightQ5_K[5120 7680]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ6_K[17920 5120]
-
blk.1.ffn_up.weightQ4_K[5120 35840]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ4_K[5120 5120]
-
blk.1.attn_qkv.weightQ5_K[5120 7680]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ6_K[17920 5120]
-
blk.2.ffn_up.weightQ4_K[5120 35840]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ4_K[5120 5120]
-
blk.2.attn_qkv.weightQ5_K[5120 7680]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ6_K[17920 5120]
-
blk.3.ffn_up.weightQ4_K[5120 35840]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ4_K[5120 5120]
-
blk.3.attn_qkv.weightQ5_K[5120 7680]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ6_K[17920 5120]
-
blk.4.ffn_up.weightQ4_K[5120 35840]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ4_K[5120 5120]
-
blk.4.attn_qkv.weightQ5_K[5120 7680]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ4_K[17920 5120]
-
blk.5.ffn_up.weightQ4_K[5120 35840]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ4_K[5120 5120]
-
blk.5.attn_qkv.weightQ5_K[5120 7680]
-
blk.6.ffn_up.weightQ4_K[5120 35840]
-
blk.6.attn_output.weightQ4_K[5120 5120]
-
blk.6.attn_qkv.weightQ5_K[5120 7680]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ6_K[17920 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ4_K[17920 5120]
-
blk.7.ffn_up.weightQ4_K[5120 35840]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ4_K[5120 5120]
-
blk.7.attn_qkv.weightQ5_K[5120 7680]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ4_K[17920 5120]
-
blk.8.ffn_up.weightQ4_K[5120 35840]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ4_K[5120 5120]
-
blk.8.attn_qkv.weightQ5_K[5120 7680]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ6_K[17920 5120]
-
blk.9.ffn_up.weightQ4_K[5120 35840]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ4_K[5120 5120]
-
blk.9.attn_qkv.weightQ5_K[5120 7680]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ4_K[17920 5120]
-
blk.10.ffn_up.weightQ4_K[5120 35840]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ4_K[5120 5120]
-
blk.10.attn_qkv.weightQ5_K[5120 7680]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ6_K[17920 5120]
-
blk.11.ffn_up.weightQ4_K[5120 35840]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ4_K[5120 5120]
-
blk.11.attn_qkv.weightQ5_K[5120 7680]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ4_K[17920 5120]
-
blk.12.ffn_up.weightQ4_K[5120 35840]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ4_K[5120 5120]
-
blk.12.attn_qkv.weightQ5_K[5120 7680]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_K[17920 5120]
-
blk.13.ffn_up.weightQ4_K[5120 35840]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ4_K[5120 5120]
-
blk.13.attn_qkv.weightQ5_K[5120 7680]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ4_K[17920 5120]
-
blk.14.ffn_up.weightQ4_K[5120 35840]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ4_K[5120 5120]
-
blk.14.attn_qkv.weightQ5_K[5120 7680]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_K[17920 5120]
-
blk.15.ffn_up.weightQ4_K[5120 35840]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ4_K[5120 5120]
-
blk.15.attn_qkv.weightQ5_K[5120 7680]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ6_K[17920 5120]
-
blk.16.ffn_up.weightQ4_K[5120 35840]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ4_K[5120 5120]
-
blk.16.attn_qkv.weightQ5_K[5120 7680]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ4_K[17920 5120]
-
blk.17.ffn_up.weightQ4_K[5120 35840]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ4_K[5120 5120]
-
blk.17.attn_qkv.weightQ5_K[5120 7680]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_K[17920 5120]
-
blk.18.ffn_up.weightQ4_K[5120 35840]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ4_K[5120 5120]
-
blk.18.attn_qkv.weightQ5_K[5120 7680]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ6_K[17920 5120]
-
blk.19.ffn_up.weightQ4_K[5120 35840]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ4_K[5120 5120]
-
blk.19.attn_qkv.weightQ5_K[5120 7680]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ4_K[17920 5120]
-
blk.20.ffn_up.weightQ4_K[5120 35840]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ4_K[5120 5120]
-
blk.20.attn_qkv.weightQ5_K[5120 7680]
-
blk.21.attn_output.weightQ4_K[5120 5120]
-
blk.21.attn_qkv.weightQ5_K[5120 7680]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_K[17920 5120]
-
blk.21.ffn_up.weightQ4_K[5120 35840]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ6_K[17920 5120]
-
blk.22.ffn_up.weightQ4_K[5120 35840]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ4_K[5120 5120]
-
blk.22.attn_qkv.weightQ5_K[5120 7680]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ4_K[17920 5120]
-
blk.23.ffn_up.weightQ4_K[5120 35840]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ4_K[5120 5120]
-
blk.23.attn_qkv.weightQ5_K[5120 7680]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_K[17920 5120]
-
blk.24.ffn_up.weightQ4_K[5120 35840]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ4_K[5120 5120]
-
blk.24.attn_qkv.weightQ5_K[5120 7680]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ6_K[17920 5120]
-
blk.25.ffn_up.weightQ4_K[5120 35840]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ4_K[5120 5120]
-
blk.25.attn_qkv.weightQ5_K[5120 7680]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ4_K[17920 5120]
-
blk.26.ffn_up.weightQ4_K[5120 35840]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ4_K[5120 5120]
-
blk.26.attn_qkv.weightQ5_K[5120 7680]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_K[17920 5120]
-
blk.27.ffn_up.weightQ4_K[5120 35840]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ4_K[5120 5120]
-
blk.27.attn_qkv.weightQ5_K[5120 7680]
-
blk.28.attn_output.weightQ4_K[5120 5120]
-
blk.28.attn_qkv.weightQ5_K[5120 7680]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ6_K[17920 5120]
-
blk.28.ffn_up.weightQ4_K[5120 35840]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ4_K[17920 5120]
-
blk.29.ffn_up.weightQ4_K[5120 35840]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ4_K[5120 5120]
-
blk.29.attn_qkv.weightQ5_K[5120 7680]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_K[17920 5120]
-
blk.30.ffn_up.weightQ4_K[5120 35840]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ4_K[5120 5120]
-
blk.30.attn_qkv.weightQ5_K[5120 7680]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ6_K[17920 5120]
-
blk.31.ffn_up.weightQ4_K[5120 35840]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ4_K[5120 5120]
-
blk.31.attn_qkv.weightQ5_K[5120 7680]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ4_K[17920 5120]
-
blk.32.ffn_up.weightQ4_K[5120 35840]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ4_K[5120 5120]
-
blk.32.attn_qkv.weightQ5_K[5120 7680]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_K[17920 5120]
-
blk.33.ffn_up.weightQ4_K[5120 35840]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ4_K[5120 5120]
-
blk.33.attn_qkv.weightQ5_K[5120 7680]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ6_K[17920 5120]
-
blk.34.ffn_up.weightQ4_K[5120 35840]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ4_K[5120 5120]
-
blk.34.attn_qkv.weightQ5_K[5120 7680]
-
blk.35.attn_output.weightQ4_K[5120 5120]
-
blk.35.attn_qkv.weightQ5_K[5120 7680]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ6_K[17920 5120]
-
blk.35.ffn_up.weightQ4_K[5120 35840]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ6_K[17920 5120]
-
blk.36.ffn_up.weightQ4_K[5120 35840]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ4_K[5120 5120]
-
blk.36.attn_qkv.weightQ5_K[5120 7680]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ6_K[17920 5120]
-
blk.37.ffn_up.weightQ4_K[5120 35840]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ4_K[5120 5120]
-
blk.37.attn_qkv.weightQ5_K[5120 7680]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ6_K[17920 5120]
-
blk.38.ffn_up.weightQ4_K[5120 35840]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ4_K[5120 5120]
-
blk.38.attn_qkv.weightQ5_K[5120 7680]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ6_K[17920 5120]
-
blk.39.ffn_up.weightQ4_K[5120 35840]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ4_K[5120 5120]
-
blk.39.attn_qkv.weightQ5_K[5120 7680]
-
output.weightQ6_K[5120 32064]
-
output_norm.weightF32[5120]
-
rope_factors_long.weightF32[64]
-
rope_factors_short.weightF32[64]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39