A new small LLaVA model fine-tuned from Phi 3 Mini [I-Quants]
vision
1,798 Pulls Updated 5 months ago
e6dff3cd6204 · 2.1GB
-
general.architecturellama
-
general.file_type30
-
general.nameLLaMA v2
-
general.quantization_version2
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count32
-
llama.context_length4096
-
llama.embedding_length3072
-
llama.feed_forward_length8192
-
llama.rope.dimension_count96
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
quantize.imatrix.chunks_count200
-
quantize.imatrix.datasetj:\\work_models\\imatrix\\groups_merged.txt
-
quantize.imatrix.entries_count224
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.scores[0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type[2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[3072, 32064]
-
blk.0.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.0.attn_norm.weightF32[3072]
-
blk.0.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.0.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.0.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.0.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.0.ffn_norm.weightF32[3072]
-
blk.0.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.1.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.1.attn_norm.weightF32[3072]
-
blk.1.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.1.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.1.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.1.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.1.ffn_norm.weightF32[3072]
-
blk.1.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.2.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.2.attn_norm.weightF32[3072]
-
blk.2.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.2.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.2.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.2.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.2.ffn_norm.weightF32[3072]
-
blk.2.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.3.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.3.attn_norm.weightF32[3072]
-
blk.3.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.3.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.3.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.3.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.3.ffn_norm.weightF32[3072]
-
blk.3.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.4.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.4.attn_norm.weightF32[3072]
-
blk.4.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.4.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.4.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.4.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.4.ffn_norm.weightF32[3072]
-
blk.4.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.5.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.5.attn_norm.weightF32[3072]
-
blk.5.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.5.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.5.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.5.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.5.ffn_norm.weightF32[3072]
-
blk.5.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.6.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.6.attn_norm.weightF32[3072]
-
blk.6.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.6.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.6.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.6.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.6.ffn_norm.weightF32[3072]
-
blk.6.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.7.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.7.attn_norm.weightF32[3072]
-
blk.7.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.7.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.7.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.7.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.7.ffn_norm.weightF32[3072]
-
blk.7.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.8.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.8.attn_norm.weightF32[3072]
-
blk.8.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.8.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.8.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.8.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.8.ffn_norm.weightF32[3072]
-
blk.8.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.9.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.9.attn_norm.weightF32[3072]
-
blk.9.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.9.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.9.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.9.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.9.ffn_norm.weightF32[3072]
-
blk.9.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.10.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.10.attn_norm.weightF32[3072]
-
blk.10.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.10.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.10.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.10.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.10.ffn_norm.weightF32[3072]
-
blk.10.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.11.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.11.attn_norm.weightF32[3072]
-
blk.11.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.11.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.11.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.11.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.11.ffn_norm.weightF32[3072]
-
blk.11.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.12.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.12.attn_norm.weightF32[3072]
-
blk.12.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.12.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.12.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.12.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.12.ffn_norm.weightF32[3072]
-
blk.12.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.13.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.13.attn_norm.weightF32[3072]
-
blk.13.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.13.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.13.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.13.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.13.ffn_norm.weightF32[3072]
-
blk.13.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.14.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.14.attn_norm.weightF32[3072]
-
blk.14.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.14.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.14.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.14.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.14.ffn_norm.weightF32[3072]
-
blk.14.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.15.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.15.attn_norm.weightF32[3072]
-
blk.15.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.15.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.15.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.15.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.15.ffn_norm.weightF32[3072]
-
blk.15.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.16.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.16.attn_norm.weightF32[3072]
-
blk.16.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.16.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.16.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.16.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.16.ffn_norm.weightF32[3072]
-
blk.16.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.17.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.17.attn_norm.weightF32[3072]
-
blk.17.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.17.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.17.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.17.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.17.ffn_norm.weightF32[3072]
-
blk.17.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.18.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.18.attn_norm.weightF32[3072]
-
blk.18.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.18.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.18.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.18.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.18.ffn_norm.weightF32[3072]
-
blk.18.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.19.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.19.attn_norm.weightF32[3072]
-
blk.19.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.19.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.19.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.19.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.19.ffn_norm.weightF32[3072]
-
blk.19.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.20.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.20.attn_norm.weightF32[3072]
-
blk.20.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.20.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.20.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.20.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.20.ffn_norm.weightF32[3072]
-
blk.20.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.21.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.21.attn_norm.weightF32[3072]
-
blk.21.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.21.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.21.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.21.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.21.ffn_norm.weightF32[3072]
-
blk.21.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.22.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.22.attn_norm.weightF32[3072]
-
blk.22.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.22.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.22.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.22.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.22.ffn_norm.weightF32[3072]
-
blk.22.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.23.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.23.attn_norm.weightF32[3072]
-
blk.23.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.23.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.23.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.23.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.23.ffn_norm.weightF32[3072]
-
blk.23.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.24.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.24.attn_norm.weightF32[3072]
-
blk.24.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.24.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.24.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.24.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.24.ffn_norm.weightF32[3072]
-
blk.24.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.25.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.25.attn_norm.weightF32[3072]
-
blk.25.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.25.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.25.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.25.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.25.ffn_norm.weightF32[3072]
-
blk.25.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.26.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.26.attn_norm.weightF32[3072]
-
blk.26.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.26.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.26.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.26.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.26.ffn_norm.weightF32[3072]
-
blk.26.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.27.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.27.attn_norm.weightF32[3072]
-
blk.27.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.27.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.27.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.27.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.27.ffn_norm.weightF32[3072]
-
blk.27.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.28.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.28.attn_norm.weightF32[3072]
-
blk.28.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.28.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.28.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.28.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.28.ffn_norm.weightF32[3072]
-
blk.28.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.29.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.29.attn_norm.weightF32[3072]
-
blk.29.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.29.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.29.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.29.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.29.ffn_norm.weightF32[3072]
-
blk.29.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.30.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.30.attn_norm.weightF32[3072]
-
blk.30.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.30.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.30.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.30.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.30.ffn_norm.weightF32[3072]
-
blk.30.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
blk.31.attn_k.weight(!unknown_type 23!)[3072, 3072]
-
blk.31.attn_norm.weightF32[3072]
-
blk.31.attn_output.weight(!unknown_type 23!)[3072, 3072]
-
blk.31.attn_q.weight(!unknown_type 23!)[3072, 3072]
-
blk.31.attn_v.weight(!unknown_type 23!)[3072, 3072]
-
blk.31.ffn_down.weight(!unknown_type 23!)[8192, 3072]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[3072, 8192]
-
blk.31.ffn_norm.weightF32[3072]
-
blk.31.ffn_up.weight(!unknown_type 23!)[3072, 8192]
-
output.weightQ6_K[3072, 32064]
-
output_norm.weightF32[3072]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31