Phi-3 Mini is a lightweight 3B state-of-the-art open models by Microsoft. Updated in July 2024.
241 Pulls Updated 4 months ago
f04e265f53f7 · 2.1GB
-
general.architecturephi3
-
general.file_type30
-
general.namePhi3
-
general.quantization_version2
-
phi3.attention.head_count32
-
phi3.attention.head_count_kv32
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count32
-
phi3.context_length4096
-
phi3.embedding_length3072
-
phi3.feed_forward_length8192
-
phi3.rope.dimension_count96
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.original_context_length4096
-
quantize.imatrix.chunks_count148
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count128
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 4, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[3072, 32064]
-
blk.0.attn_norm.weightF32[3072]
-
blk.0.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.0.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.0.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.0.ffn_norm.weightF32[3072]
-
blk.0.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.1.attn_norm.weightF32[3072]
-
blk.1.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.1.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.1.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.1.ffn_norm.weightF32[3072]
-
blk.1.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.2.attn_norm.weightF32[3072]
-
blk.2.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.2.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.2.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.2.ffn_norm.weightF32[3072]
-
blk.2.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.3.attn_norm.weightF32[3072]
-
blk.3.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.3.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.3.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.3.ffn_norm.weightF32[3072]
-
blk.3.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.4.attn_norm.weightF32[3072]
-
blk.4.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.4.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.4.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.4.ffn_norm.weightF32[3072]
-
blk.4.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.5.attn_norm.weightF32[3072]
-
blk.5.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.5.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.5.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.5.ffn_norm.weightF32[3072]
-
blk.5.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.6.attn_norm.weightF32[3072]
-
blk.6.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.6.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.6.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.6.ffn_norm.weightF32[3072]
-
blk.6.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.7.attn_norm.weightF32[3072]
-
blk.7.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.7.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.7.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.7.ffn_norm.weightF32[3072]
-
blk.7.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.8.attn_norm.weightF32[3072]
-
blk.8.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.8.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.8.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.8.ffn_norm.weightF32[3072]
-
blk.8.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.9.attn_norm.weightF32[3072]
-
blk.9.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.9.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.9.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.9.ffn_norm.weightF32[3072]
-
blk.9.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.10.attn_norm.weightF32[3072]
-
blk.10.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.10.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.10.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.10.ffn_norm.weightF32[3072]
-
blk.10.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.11.attn_norm.weightF32[3072]
-
blk.11.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.11.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.11.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.11.ffn_norm.weightF32[3072]
-
blk.11.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.12.attn_norm.weightF32[3072]
-
blk.12.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.12.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.12.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.12.ffn_norm.weightF32[3072]
-
blk.12.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.13.attn_norm.weightF32[3072]
-
blk.13.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.13.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.13.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.13.ffn_norm.weightF32[3072]
-
blk.13.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.14.attn_norm.weightF32[3072]
-
blk.14.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.14.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.14.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.14.ffn_norm.weightF32[3072]
-
blk.14.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.15.attn_norm.weightF32[3072]
-
blk.15.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.15.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.15.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.15.ffn_norm.weightF32[3072]
-
blk.15.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.16.attn_norm.weightF32[3072]
-
blk.16.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.16.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.16.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.16.ffn_norm.weightF32[3072]
-
blk.16.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.17.attn_norm.weightF32[3072]
-
blk.17.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.17.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.17.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.17.ffn_norm.weightF32[3072]
-
blk.17.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.18.attn_norm.weightF32[3072]
-
blk.18.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.18.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.18.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.18.ffn_norm.weightF32[3072]
-
blk.18.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.19.attn_norm.weightF32[3072]
-
blk.19.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.19.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.19.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.19.ffn_norm.weightF32[3072]
-
blk.19.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.20.attn_norm.weightF32[3072]
-
blk.20.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.20.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.20.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.20.ffn_norm.weightF32[3072]
-
blk.20.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.21.attn_norm.weightF32[3072]
-
blk.21.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.21.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.21.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.21.ffn_norm.weightF32[3072]
-
blk.21.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.22.attn_norm.weightF32[3072]
-
blk.22.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.22.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.22.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.22.ffn_norm.weightF32[3072]
-
blk.22.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.23.attn_norm.weightF32[3072]
-
blk.23.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.23.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.23.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.23.ffn_norm.weightF32[3072]
-
blk.23.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.24.attn_norm.weightF32[3072]
-
blk.24.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.24.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.24.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.24.ffn_norm.weightF32[3072]
-
blk.24.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.25.attn_norm.weightF32[3072]
-
blk.25.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.25.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.25.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.25.ffn_norm.weightF32[3072]
-
blk.25.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.26.attn_norm.weightF32[3072]
-
blk.26.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.26.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.26.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.26.ffn_norm.weightF32[3072]
-
blk.26.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.27.attn_norm.weightF32[3072]
-
blk.27.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.27.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.27.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.27.ffn_norm.weightF32[3072]
-
blk.27.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.28.attn_norm.weightF32[3072]
-
blk.28.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.28.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.28.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.28.ffn_norm.weightF32[3072]
-
blk.28.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.29.attn_norm.weightF32[3072]
-
blk.29.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.29.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.29.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.29.ffn_norm.weightF32[3072]
-
blk.29.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.30.attn_norm.weightF32[3072]
-
blk.30.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.30.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.30.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.30.ffn_norm.weightF32[3072]
-
blk.30.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
blk.31.attn_norm.weightF32[3072]
-
blk.31.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.31.attn_qkv.weight(!unknown_type 23!)[3072, 9216]
-
blk.31.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.31.ffn_norm.weightF32[3072]
-
blk.31.ffn_up.weight(!unknown_type 23!)[3072, 16384]
-
output.weightQ6_K[3072, 32064]
-
output_norm.weightF32[3072]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31