latest
15GB
14B
14 Pulls Updated 3 months ago
93521adb7e4a · 15GB
-
general.architecturephi3
-
general.file_typeQ8_0
-
phi3.attention.head_count40
-
phi3.attention.head_count_kv10
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count40
-
phi3.context_length4096
-
phi3.embedding_length5120
-
phi3.feed_forward_length17920
-
phi3.rope.dimension_count128
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.original_context_length4096
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 4 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ8_0[5120 32064]
-
blk.0.attn_output.weightQ8_0[5120 5120]
-
blk.0.attn_qkv.weightQ8_0[5120 7680]
-
blk.0.ffn_up.weightQ8_0[5120 35840]
-
blk.0.ffn_down.weightQ8_0[17920 5120]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ8_0[5120 5120]
-
blk.1.attn_qkv.weightQ8_0[5120 7680]
-
blk.1.ffn_up.weightQ8_0[5120 35840]
-
blk.1.ffn_down.weightQ8_0[17920 5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ8_0[5120 5120]
-
blk.2.attn_qkv.weightQ8_0[5120 7680]
-
blk.2.ffn_up.weightQ8_0[5120 35840]
-
blk.2.ffn_down.weightQ8_0[17920 5120]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ8_0[5120 5120]
-
blk.3.attn_qkv.weightQ8_0[5120 7680]
-
blk.3.ffn_up.weightQ8_0[5120 35840]
-
blk.3.ffn_down.weightQ8_0[17920 5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ8_0[5120 5120]
-
blk.4.attn_qkv.weightQ8_0[5120 7680]
-
blk.4.ffn_up.weightQ8_0[5120 35840]
-
blk.4.ffn_down.weightQ8_0[17920 5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ8_0[5120 5120]
-
blk.5.attn_qkv.weightQ8_0[5120 7680]
-
blk.5.ffn_up.weightQ8_0[5120 35840]
-
blk.5.ffn_down.weightQ8_0[17920 5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.6.attn_output.weightQ8_0[5120 5120]
-
blk.6.attn_qkv.weightQ8_0[5120 7680]
-
blk.6.ffn_up.weightQ8_0[5120 35840]
-
blk.6.ffn_down.weightQ8_0[17920 5120]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ8_0[5120 5120]
-
blk.7.attn_qkv.weightQ8_0[5120 7680]
-
blk.7.ffn_up.weightQ8_0[5120 35840]
-
blk.7.ffn_down.weightQ8_0[17920 5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ8_0[5120 5120]
-
blk.8.attn_qkv.weightQ8_0[5120 7680]
-
blk.8.ffn_up.weightQ8_0[5120 35840]
-
blk.8.ffn_down.weightQ8_0[17920 5120]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ8_0[5120 5120]
-
blk.9.attn_qkv.weightQ8_0[5120 7680]
-
blk.9.ffn_up.weightQ8_0[5120 35840]
-
blk.9.ffn_down.weightQ8_0[17920 5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ8_0[5120 5120]
-
blk.10.attn_qkv.weightQ8_0[5120 7680]
-
blk.10.ffn_up.weightQ8_0[5120 35840]
-
blk.10.ffn_down.weightQ8_0[17920 5120]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ8_0[5120 5120]
-
blk.11.attn_qkv.weightQ8_0[5120 7680]
-
blk.11.ffn_up.weightQ8_0[5120 35840]
-
blk.11.ffn_down.weightQ8_0[17920 5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ8_0[5120 5120]
-
blk.12.attn_qkv.weightQ8_0[5120 7680]
-
blk.12.ffn_up.weightQ8_0[5120 35840]
-
blk.12.ffn_down.weightQ8_0[17920 5120]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ8_0[5120 5120]
-
blk.13.attn_qkv.weightQ8_0[5120 7680]
-
blk.13.ffn_up.weightQ8_0[5120 35840]
-
blk.13.ffn_down.weightQ8_0[17920 5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ8_0[5120 5120]
-
blk.14.attn_qkv.weightQ8_0[5120 7680]
-
blk.14.ffn_up.weightQ8_0[5120 35840]
-
blk.14.ffn_down.weightQ8_0[17920 5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ8_0[5120 5120]
-
blk.15.attn_qkv.weightQ8_0[5120 7680]
-
blk.15.ffn_up.weightQ8_0[5120 35840]
-
blk.15.ffn_down.weightQ8_0[17920 5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ8_0[5120 5120]
-
blk.16.attn_qkv.weightQ8_0[5120 7680]
-
blk.16.ffn_up.weightQ8_0[5120 35840]
-
blk.16.ffn_down.weightQ8_0[17920 5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ8_0[5120 5120]
-
blk.17.attn_qkv.weightQ8_0[5120 7680]
-
blk.17.ffn_up.weightQ8_0[5120 35840]
-
blk.17.ffn_down.weightQ8_0[17920 5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ8_0[5120 5120]
-
blk.18.attn_qkv.weightQ8_0[5120 7680]
-
blk.18.ffn_up.weightQ8_0[5120 35840]
-
blk.18.ffn_down.weightQ8_0[17920 5120]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ8_0[5120 5120]
-
blk.19.attn_qkv.weightQ8_0[5120 7680]
-
blk.19.ffn_up.weightQ8_0[5120 35840]
-
blk.19.ffn_down.weightQ8_0[17920 5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ8_0[5120 5120]
-
blk.20.attn_qkv.weightQ8_0[5120 7680]
-
blk.20.ffn_up.weightQ8_0[5120 35840]
-
blk.20.ffn_down.weightQ8_0[17920 5120]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.21.attn_output.weightQ8_0[5120 5120]
-
blk.21.attn_qkv.weightQ8_0[5120 7680]
-
blk.21.ffn_up.weightQ8_0[5120 35840]
-
blk.21.ffn_down.weightQ8_0[17920 5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ8_0[5120 5120]
-
blk.22.attn_qkv.weightQ8_0[5120 7680]
-
blk.22.ffn_up.weightQ8_0[5120 35840]
-
blk.22.ffn_down.weightQ8_0[17920 5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ8_0[5120 5120]
-
blk.23.attn_qkv.weightQ8_0[5120 7680]
-
blk.23.ffn_up.weightQ8_0[5120 35840]
-
blk.23.ffn_down.weightQ8_0[17920 5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ8_0[5120 5120]
-
blk.24.attn_qkv.weightQ8_0[5120 7680]
-
blk.24.ffn_up.weightQ8_0[5120 35840]
-
blk.24.ffn_down.weightQ8_0[17920 5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ8_0[5120 5120]
-
blk.25.attn_qkv.weightQ8_0[5120 7680]
-
blk.25.ffn_up.weightQ8_0[5120 35840]
-
blk.25.ffn_down.weightQ8_0[17920 5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ8_0[5120 5120]
-
blk.26.attn_qkv.weightQ8_0[5120 7680]
-
blk.26.ffn_up.weightQ8_0[5120 35840]
-
blk.26.ffn_down.weightQ8_0[17920 5120]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ8_0[5120 5120]
-
blk.27.attn_qkv.weightQ8_0[5120 7680]
-
blk.27.ffn_up.weightQ8_0[5120 35840]
-
blk.27.ffn_down.weightQ8_0[17920 5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.28.attn_output.weightQ8_0[5120 5120]
-
blk.28.attn_qkv.weightQ8_0[5120 7680]
-
blk.28.ffn_up.weightQ8_0[5120 35840]
-
blk.28.ffn_down.weightQ8_0[17920 5120]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ8_0[5120 5120]
-
blk.29.attn_qkv.weightQ8_0[5120 7680]
-
blk.29.ffn_up.weightQ8_0[5120 35840]
-
blk.29.ffn_down.weightQ8_0[17920 5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ8_0[5120 5120]
-
blk.30.attn_qkv.weightQ8_0[5120 7680]
-
blk.30.ffn_up.weightQ8_0[5120 35840]
-
blk.30.ffn_down.weightQ8_0[17920 5120]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ8_0[5120 5120]
-
blk.31.attn_qkv.weightQ8_0[5120 7680]
-
blk.31.ffn_up.weightQ8_0[5120 35840]
-
blk.31.ffn_down.weightQ8_0[17920 5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ8_0[5120 5120]
-
blk.32.attn_qkv.weightQ8_0[5120 7680]
-
blk.32.ffn_up.weightQ8_0[5120 35840]
-
blk.32.ffn_down.weightQ8_0[17920 5120]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ8_0[5120 5120]
-
blk.33.attn_qkv.weightQ8_0[5120 7680]
-
blk.33.ffn_up.weightQ8_0[5120 35840]
-
blk.33.ffn_down.weightQ8_0[17920 5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ8_0[5120 5120]
-
blk.34.attn_qkv.weightQ8_0[5120 7680]
-
blk.34.ffn_up.weightQ8_0[5120 35840]
-
blk.34.ffn_down.weightQ8_0[17920 5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.35.attn_output.weightQ8_0[5120 5120]
-
blk.35.attn_qkv.weightQ8_0[5120 7680]
-
blk.35.ffn_up.weightQ8_0[5120 35840]
-
blk.35.ffn_down.weightQ8_0[17920 5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ8_0[5120 5120]
-
blk.36.attn_qkv.weightQ8_0[5120 7680]
-
blk.36.ffn_up.weightQ8_0[5120 35840]
-
blk.36.ffn_down.weightQ8_0[17920 5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ8_0[5120 5120]
-
blk.37.attn_qkv.weightQ8_0[5120 7680]
-
blk.37.ffn_up.weightQ8_0[5120 35840]
-
blk.37.ffn_down.weightQ8_0[17920 5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ8_0[5120 5120]
-
blk.38.attn_qkv.weightQ8_0[5120 7680]
-
blk.38.ffn_up.weightQ8_0[5120 35840]
-
blk.38.ffn_down.weightQ8_0[17920 5120]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ8_0[5120 5120]
-
blk.39.attn_qkv.weightQ8_0[5120 7680]
-
blk.39.ffn_up.weightQ8_0[5120 35840]
-
blk.39.ffn_down.weightQ8_0[17920 5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_norm.weightF32[5120]
-
output_norm.weightF32[5120]
-
output.weightQ8_0[5120 32064]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39