A new small LLaVA model fine-tuned from Phi 3 Mini [I-Quants]
vision
1,798 Pulls Updated 5 months ago
ce2375a6e537 · 1.5GB
-
general.architecturellama
-
general.file_type23
-
general.nameLLaMA v2
-
general.quantization_version2
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count32
-
llama.context_length4096
-
llama.embedding_length3072
-
llama.feed_forward_length8192
-
llama.rope.dimension_count96
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
quantize.imatrix.chunks_count200
-
quantize.imatrix.datasetj:\\work_models\\imatrix\\groups_merged.txt
-
quantize.imatrix.entries_count224
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.scores[0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type[2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[3072, 32064]
-
blk.0.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.0.attn_norm.weightF32[3072]
-
blk.0.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.0.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.0.attn_v.weightI32[3072, 3072]
-
blk.0.ffn_down.weightI32[8192, 3072]
-
blk.0.ffn_gate.weightI32[3072, 8192]
-
blk.0.ffn_norm.weightF32[3072]
-
blk.0.ffn_up.weightI32[3072, 8192]
-
blk.1.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.1.attn_norm.weightF32[3072]
-
blk.1.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.1.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.1.attn_v.weightI32[3072, 3072]
-
blk.1.ffn_down.weightI32[8192, 3072]
-
blk.1.ffn_gate.weightI32[3072, 8192]
-
blk.1.ffn_norm.weightF32[3072]
-
blk.1.ffn_up.weightI32[3072, 8192]
-
blk.2.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.2.attn_norm.weightF32[3072]
-
blk.2.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.2.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.2.attn_v.weightI32[3072, 3072]
-
blk.2.ffn_down.weightI32[8192, 3072]
-
blk.2.ffn_gate.weightI32[3072, 8192]
-
blk.2.ffn_norm.weightF32[3072]
-
blk.2.ffn_up.weightI32[3072, 8192]
-
blk.3.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.3.attn_norm.weightF32[3072]
-
blk.3.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.3.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.3.attn_v.weightI32[3072, 3072]
-
blk.3.ffn_down.weightI32[8192, 3072]
-
blk.3.ffn_gate.weightI32[3072, 8192]
-
blk.3.ffn_norm.weightF32[3072]
-
blk.3.ffn_up.weightI32[3072, 8192]
-
blk.4.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.4.attn_norm.weightF32[3072]
-
blk.4.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.4.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.4.attn_v.weightI32[3072, 3072]
-
blk.4.ffn_down.weightI32[8192, 3072]
-
blk.4.ffn_gate.weightI32[3072, 8192]
-
blk.4.ffn_norm.weightF32[3072]
-
blk.4.ffn_up.weightI32[3072, 8192]
-
blk.5.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.5.attn_norm.weightF32[3072]
-
blk.5.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.5.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.5.attn_v.weightI32[3072, 3072]
-
blk.5.ffn_down.weightI32[8192, 3072]
-
blk.5.ffn_gate.weightI32[3072, 8192]
-
blk.5.ffn_norm.weightF32[3072]
-
blk.5.ffn_up.weightI32[3072, 8192]
-
blk.6.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.6.attn_norm.weightF32[3072]
-
blk.6.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.6.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.6.attn_v.weightI32[3072, 3072]
-
blk.6.ffn_down.weightI32[8192, 3072]
-
blk.6.ffn_gate.weightI32[3072, 8192]
-
blk.6.ffn_norm.weightF32[3072]
-
blk.6.ffn_up.weightI32[3072, 8192]
-
blk.7.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.7.attn_norm.weightF32[3072]
-
blk.7.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.7.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.7.attn_v.weightI32[3072, 3072]
-
blk.7.ffn_down.weightI32[8192, 3072]
-
blk.7.ffn_gate.weightI32[3072, 8192]
-
blk.7.ffn_norm.weightF32[3072]
-
blk.7.ffn_up.weightI32[3072, 8192]
-
blk.8.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.8.attn_norm.weightF32[3072]
-
blk.8.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.8.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.8.attn_v.weightI32[3072, 3072]
-
blk.8.ffn_down.weightI32[8192, 3072]
-
blk.8.ffn_gate.weightI32[3072, 8192]
-
blk.8.ffn_norm.weightF32[3072]
-
blk.8.ffn_up.weightI32[3072, 8192]
-
blk.9.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.9.attn_norm.weightF32[3072]
-
blk.9.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.9.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.9.attn_v.weightI32[3072, 3072]
-
blk.9.ffn_down.weightI32[8192, 3072]
-
blk.9.ffn_gate.weightI32[3072, 8192]
-
blk.9.ffn_norm.weightF32[3072]
-
blk.9.ffn_up.weightI32[3072, 8192]
-
blk.10.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.10.attn_norm.weightF32[3072]
-
blk.10.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.10.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.10.attn_v.weightI32[3072, 3072]
-
blk.10.ffn_down.weightI32[8192, 3072]
-
blk.10.ffn_gate.weightI32[3072, 8192]
-
blk.10.ffn_norm.weightF32[3072]
-
blk.10.ffn_up.weightI32[3072, 8192]
-
blk.11.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.11.attn_norm.weightF32[3072]
-
blk.11.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.11.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.11.attn_v.weightI32[3072, 3072]
-
blk.11.ffn_down.weightI32[8192, 3072]
-
blk.11.ffn_gate.weightI32[3072, 8192]
-
blk.11.ffn_norm.weightF32[3072]
-
blk.11.ffn_up.weightI32[3072, 8192]
-
blk.12.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.12.attn_norm.weightF32[3072]
-
blk.12.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.12.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.12.attn_v.weightI32[3072, 3072]
-
blk.12.ffn_down.weightI32[8192, 3072]
-
blk.12.ffn_gate.weightI32[3072, 8192]
-
blk.12.ffn_norm.weightF32[3072]
-
blk.12.ffn_up.weightI32[3072, 8192]
-
blk.13.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.13.attn_norm.weightF32[3072]
-
blk.13.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.13.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.13.attn_v.weightI32[3072, 3072]
-
blk.13.ffn_down.weightI32[8192, 3072]
-
blk.13.ffn_gate.weightI32[3072, 8192]
-
blk.13.ffn_norm.weightF32[3072]
-
blk.13.ffn_up.weightI32[3072, 8192]
-
blk.14.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.14.attn_norm.weightF32[3072]
-
blk.14.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.14.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.14.attn_v.weightI32[3072, 3072]
-
blk.14.ffn_down.weightI32[8192, 3072]
-
blk.14.ffn_gate.weightI32[3072, 8192]
-
blk.14.ffn_norm.weightF32[3072]
-
blk.14.ffn_up.weightI32[3072, 8192]
-
blk.15.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.15.attn_norm.weightF32[3072]
-
blk.15.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.15.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.15.attn_v.weightI32[3072, 3072]
-
blk.15.ffn_down.weightI32[8192, 3072]
-
blk.15.ffn_gate.weightI32[3072, 8192]
-
blk.15.ffn_norm.weightF32[3072]
-
blk.15.ffn_up.weightI32[3072, 8192]
-
blk.16.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.16.attn_norm.weightF32[3072]
-
blk.16.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.16.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.16.attn_v.weightI32[3072, 3072]
-
blk.16.ffn_down.weightI32[8192, 3072]
-
blk.16.ffn_gate.weightI32[3072, 8192]
-
blk.16.ffn_norm.weightF32[3072]
-
blk.16.ffn_up.weightI32[3072, 8192]
-
blk.17.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.17.attn_norm.weightF32[3072]
-
blk.17.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.17.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.17.attn_v.weightI32[3072, 3072]
-
blk.17.ffn_down.weightI32[8192, 3072]
-
blk.17.ffn_gate.weightI32[3072, 8192]
-
blk.17.ffn_norm.weightF32[3072]
-
blk.17.ffn_up.weightI32[3072, 8192]
-
blk.18.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.18.attn_norm.weightF32[3072]
-
blk.18.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.18.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.18.attn_v.weightI32[3072, 3072]
-
blk.18.ffn_down.weightI32[8192, 3072]
-
blk.18.ffn_gate.weightI32[3072, 8192]
-
blk.18.ffn_norm.weightF32[3072]
-
blk.18.ffn_up.weightI32[3072, 8192]
-
blk.19.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.19.attn_norm.weightF32[3072]
-
blk.19.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.19.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.19.attn_v.weightI32[3072, 3072]
-
blk.19.ffn_down.weightI32[8192, 3072]
-
blk.19.ffn_gate.weightI32[3072, 8192]
-
blk.19.ffn_norm.weightF32[3072]
-
blk.19.ffn_up.weightI32[3072, 8192]
-
blk.20.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.20.attn_norm.weightF32[3072]
-
blk.20.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.20.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.20.attn_v.weightI32[3072, 3072]
-
blk.20.ffn_down.weightI32[8192, 3072]
-
blk.20.ffn_gate.weightI32[3072, 8192]
-
blk.20.ffn_norm.weightF32[3072]
-
blk.20.ffn_up.weightI32[3072, 8192]
-
blk.21.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.21.attn_norm.weightF32[3072]
-
blk.21.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.21.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.21.attn_v.weightI32[3072, 3072]
-
blk.21.ffn_down.weightI32[8192, 3072]
-
blk.21.ffn_gate.weightI32[3072, 8192]
-
blk.21.ffn_norm.weightF32[3072]
-
blk.21.ffn_up.weightI32[3072, 8192]
-
blk.22.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.22.attn_norm.weightF32[3072]
-
blk.22.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.22.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.22.attn_v.weightI32[3072, 3072]
-
blk.22.ffn_down.weightI32[8192, 3072]
-
blk.22.ffn_gate.weightI32[3072, 8192]
-
blk.22.ffn_norm.weightF32[3072]
-
blk.22.ffn_up.weightI32[3072, 8192]
-
blk.23.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.23.attn_norm.weightF32[3072]
-
blk.23.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.23.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.23.attn_v.weightI32[3072, 3072]
-
blk.23.ffn_down.weightI32[8192, 3072]
-
blk.23.ffn_gate.weightI32[3072, 8192]
-
blk.23.ffn_norm.weightF32[3072]
-
blk.23.ffn_up.weightI32[3072, 8192]
-
blk.24.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.24.attn_norm.weightF32[3072]
-
blk.24.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.24.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.24.attn_v.weightI32[3072, 3072]
-
blk.24.ffn_down.weightI32[8192, 3072]
-
blk.24.ffn_gate.weightI32[3072, 8192]
-
blk.24.ffn_norm.weightF32[3072]
-
blk.24.ffn_up.weightI32[3072, 8192]
-
blk.25.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.25.attn_norm.weightF32[3072]
-
blk.25.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.25.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.25.attn_v.weightI32[3072, 3072]
-
blk.25.ffn_down.weightI32[8192, 3072]
-
blk.25.ffn_gate.weightI32[3072, 8192]
-
blk.25.ffn_norm.weightF32[3072]
-
blk.25.ffn_up.weightI32[3072, 8192]
-
blk.26.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.26.attn_norm.weightF32[3072]
-
blk.26.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.26.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.26.attn_v.weightI32[3072, 3072]
-
blk.26.ffn_down.weightI32[8192, 3072]
-
blk.26.ffn_gate.weightI32[3072, 8192]
-
blk.26.ffn_norm.weightF32[3072]
-
blk.26.ffn_up.weightI32[3072, 8192]
-
blk.27.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.27.attn_norm.weightF32[3072]
-
blk.27.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.27.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.27.attn_v.weightI32[3072, 3072]
-
blk.27.ffn_down.weightI32[8192, 3072]
-
blk.27.ffn_gate.weightI32[3072, 8192]
-
blk.27.ffn_norm.weightF32[3072]
-
blk.27.ffn_up.weightI32[3072, 8192]
-
blk.28.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.28.attn_norm.weightF32[3072]
-
blk.28.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.28.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.28.attn_v.weightI32[3072, 3072]
-
blk.28.ffn_down.weightI32[8192, 3072]
-
blk.28.ffn_gate.weightI32[3072, 8192]
-
blk.28.ffn_norm.weightF32[3072]
-
blk.28.ffn_up.weightI32[3072, 8192]
-
blk.29.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.29.attn_norm.weightF32[3072]
-
blk.29.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.29.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.29.attn_v.weightI32[3072, 3072]
-
blk.29.ffn_down.weightI32[8192, 3072]
-
blk.29.ffn_gate.weightI32[3072, 8192]
-
blk.29.ffn_norm.weightF32[3072]
-
blk.29.ffn_up.weightI32[3072, 8192]
-
blk.30.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.30.attn_norm.weightF32[3072]
-
blk.30.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.30.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.30.attn_v.weightI32[3072, 3072]
-
blk.30.ffn_down.weightI32[8192, 3072]
-
blk.30.ffn_gate.weightI32[3072, 8192]
-
blk.30.ffn_norm.weightF32[3072]
-
blk.30.ffn_up.weightI32[3072, 8192]
-
blk.31.attn_k.weight(!unknown_type 22!)[3072, 3072]
-
blk.31.attn_norm.weightF32[3072]
-
blk.31.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.31.attn_q.weight(!unknown_type 22!)[3072, 3072]
-
blk.31.attn_v.weightI32[3072, 3072]
-
blk.31.ffn_down.weightI32[8192, 3072]
-
blk.31.ffn_gate.weightI32[3072, 8192]
-
blk.31.ffn_norm.weightF32[3072]
-
blk.31.ffn_up.weightI32[3072, 8192]
-
output.weightQ5_K[3072, 32064]
-
output_norm.weightF32[3072]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31