A new small LLaVA model fine-tuned from Phi 3 Mini [I-Quants]
vision
1,825 Pulls Updated 7 months ago
bd54fc8eec20 · 1.7GB
-
general.architecturellama
-
general.file_type26
-
general.nameLLaMA v2
-
general.quantization_version2
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count32
-
llama.context_length4096
-
llama.embedding_length3072
-
llama.feed_forward_length8192
-
llama.rope.dimension_count96
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
quantize.imatrix.chunks_count200
-
quantize.imatrix.datasetj:\\work_models\\imatrix\\groups_merged.txt
-
quantize.imatrix.entries_count224
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.scores[0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type[2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[3072, 32064]
-
blk.0.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.0.attn_norm.weightF32[3072]
-
blk.0.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.0.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.0.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.0.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.0.ffn_norm.weightF32[3072]
-
blk.0.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.1.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.1.attn_norm.weightF32[3072]
-
blk.1.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.1.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.1.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.1.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.1.ffn_norm.weightF32[3072]
-
blk.1.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.2.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.2.attn_norm.weightF32[3072]
-
blk.2.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.2.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.2.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.2.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.2.ffn_norm.weightF32[3072]
-
blk.2.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.3.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.3.attn_norm.weightF32[3072]
-
blk.3.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.3.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.3.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.3.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.3.ffn_norm.weightF32[3072]
-
blk.3.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.4.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.4.attn_norm.weightF32[3072]
-
blk.4.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.4.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.4.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.4.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.4.ffn_norm.weightF32[3072]
-
blk.4.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.5.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.5.attn_norm.weightF32[3072]
-
blk.5.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.5.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.5.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.5.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.5.ffn_norm.weightF32[3072]
-
blk.5.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.6.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.6.attn_norm.weightF32[3072]
-
blk.6.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.6.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.6.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.6.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.6.ffn_norm.weightF32[3072]
-
blk.6.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.7.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.7.attn_norm.weightF32[3072]
-
blk.7.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.7.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.7.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.7.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.7.ffn_norm.weightF32[3072]
-
blk.7.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.8.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.8.attn_norm.weightF32[3072]
-
blk.8.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.8.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.8.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.8.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.8.ffn_norm.weightF32[3072]
-
blk.8.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.9.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.9.attn_norm.weightF32[3072]
-
blk.9.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.9.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.9.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.9.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.9.ffn_norm.weightF32[3072]
-
blk.9.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.10.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.10.attn_norm.weightF32[3072]
-
blk.10.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.10.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.10.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.10.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.10.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.10.ffn_norm.weightF32[3072]
-
blk.10.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.11.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.11.attn_norm.weightF32[3072]
-
blk.11.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.11.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.11.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.11.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.11.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.11.ffn_norm.weightF32[3072]
-
blk.11.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.12.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.12.attn_norm.weightF32[3072]
-
blk.12.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.12.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.12.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.12.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.12.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.12.ffn_norm.weightF32[3072]
-
blk.12.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.13.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.13.attn_norm.weightF32[3072]
-
blk.13.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.13.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.13.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.13.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.13.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.13.ffn_norm.weightF32[3072]
-
blk.13.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.14.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.14.attn_norm.weightF32[3072]
-
blk.14.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.14.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.14.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.14.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.14.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.14.ffn_norm.weightF32[3072]
-
blk.14.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.15.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.15.attn_norm.weightF32[3072]
-
blk.15.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.15.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.15.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.15.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.15.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.15.ffn_norm.weightF32[3072]
-
blk.15.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.16.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.16.attn_norm.weightF32[3072]
-
blk.16.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.16.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.16.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.16.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.16.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.16.ffn_norm.weightF32[3072]
-
blk.16.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.17.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.17.attn_norm.weightF32[3072]
-
blk.17.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.17.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.17.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.17.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.17.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.17.ffn_norm.weightF32[3072]
-
blk.17.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.18.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.18.attn_norm.weightF32[3072]
-
blk.18.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.18.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.18.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.18.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.18.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.18.ffn_norm.weightF32[3072]
-
blk.18.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.19.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.19.attn_norm.weightF32[3072]
-
blk.19.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.19.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.19.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.19.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.19.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.19.ffn_norm.weightF32[3072]
-
blk.19.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.20.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.20.attn_norm.weightF32[3072]
-
blk.20.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.20.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.20.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.20.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.20.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.20.ffn_norm.weightF32[3072]
-
blk.20.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.21.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.21.attn_norm.weightF32[3072]
-
blk.21.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.21.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.21.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.21.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.21.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.21.ffn_norm.weightF32[3072]
-
blk.21.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.22.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.22.attn_norm.weightF32[3072]
-
blk.22.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.22.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.22.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.22.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.22.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.22.ffn_norm.weightF32[3072]
-
blk.22.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.23.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.23.attn_norm.weightF32[3072]
-
blk.23.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.23.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.23.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.23.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.23.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.23.ffn_norm.weightF32[3072]
-
blk.23.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.24.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.24.attn_norm.weightF32[3072]
-
blk.24.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.24.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.24.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.24.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.24.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.24.ffn_norm.weightF32[3072]
-
blk.24.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.25.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.25.attn_norm.weightF32[3072]
-
blk.25.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.25.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.25.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.25.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.25.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.25.ffn_norm.weightF32[3072]
-
blk.25.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.26.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.26.attn_norm.weightF32[3072]
-
blk.26.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.26.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.26.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.26.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.26.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.26.ffn_norm.weightF32[3072]
-
blk.26.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.27.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.27.attn_norm.weightF32[3072]
-
blk.27.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.27.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.27.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.27.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.27.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.27.ffn_norm.weightF32[3072]
-
blk.27.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.28.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.28.attn_norm.weightF32[3072]
-
blk.28.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.28.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.28.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.28.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.28.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.28.ffn_norm.weightF32[3072]
-
blk.28.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.29.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.29.attn_norm.weightF32[3072]
-
blk.29.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.29.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.29.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.29.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.29.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.29.ffn_norm.weightF32[3072]
-
blk.29.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.30.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.30.attn_norm.weightF32[3072]
-
blk.30.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.30.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.30.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.30.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.30.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.30.ffn_norm.weightF32[3072]
-
blk.30.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
blk.31.attn_k.weight(!unknown_type 21!)[3072, 3072]
-
blk.31.attn_norm.weightF32[3072]
-
blk.31.attn_output.weight(!unknown_type 21!)[3072, 3072]
-
blk.31.attn_q.weight(!unknown_type 21!)[3072, 3072]
-
blk.31.attn_v.weight(!unknown_type 21!)[3072, 3072]
-
blk.31.ffn_down.weight(!unknown_type 21!)[8192, 3072]
-
blk.31.ffn_gate.weight(!unknown_type 21!)[3072, 8192]
-
blk.31.ffn_norm.weightF32[3072]
-
blk.31.ffn_up.weight(!unknown_type 21!)[3072, 8192]
-
output.weightQ6_K[3072, 32064]
-
output_norm.weightF32[3072]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31