latest
21GB
Vision
70 Pulls Updated 3 days ago
c63d594da379 · 1.9GB
-
general.architecturemllama
-
general.file_typeF16
-
mllama.vision.attention.head_count16
-
mllama.vision.attention.layer_norm_epsilon1e-05
-
mllama.vision.block_count32
-
mllama.vision.embedding_length1280
-
mllama.vision.feed_forward_length5120
-
mllama.vision.global.block_count8
-
mllama.vision.image_size560
-
mllama.vision.intermediate_layers_indices3
-
mllama.vision.max_num_tiles4
-
mllama.vision.num_channels3
-
mllama.vision.patch_size14
-
mllama.vision.projection_dim4096
-
NameTypeShape
-
v.class_embdF32[1280]
-
v.patch_embd.weightF16[14 14 3 1280]
-
v.tile_position_embd.gateF32[1]
-
v.position_embd.gateF32[1]
-
v.position_embd.weightF16[1280 1601]
-
v.tile_position_embd.weightF32[8197120 9]
-
v.pre_tile_position_embd.gateF32[1]
-
v.pre_tile_position_embd.weightF32[5120 9]
-
v.post_tile_position_embd.gateF32[1]
-
v.post_tile_position_embd.weightF32[5120 9]
-
v.blk.0.attn_q.weightF16[1280 1280]
-
v.blk.0.attn_k.weightF16[1280 1280]
-
v.blk.0.attn_v.weightF16[1280 1280]
-
v.blk.0.attn_out.weightF16[1280 1280]
-
v.blk.0.ffn_down.weightF16[1280 5120]
-
v.blk.0.ffn_down.biasF32[5120]
-
v.blk.0.ffn_up.weightF16[5120 1280]
-
v.blk.0.ffn_up.biasF32[1280]
-
v.blk.0.ln1.weightF32[1280]
-
v.blk.0.ln1.biasF32[1280]
-
v.blk.0.ln2.weightF32[1280]
-
v.blk.0.ln2.biasF32[1280]
-
v.global.blk.0.attn_gateF32[1]
-
v.global.blk.0.ffn_gateF32[1]
-
v.global.blk.0.attn_q.weightF16[1280 1280]
-
v.global.blk.0.attn_k.weightF16[1280 1280]
-
v.global.blk.0.attn_v.weightF16[1280 1280]
-
v.global.blk.0.attn_out.weightF16[1280 1280]
-
v.global.blk.0.ffn_down.weightF16[1280 5120]
-
v.global.blk.0.ffn_down.biasF32[5120]
-
v.global.blk.0.ffn_up.weightF16[5120 1280]
-
v.global.blk.0.ffn_up.biasF32[1280]
-
v.global.blk.0.ln1.weightF32[1280]
-
v.global.blk.0.ln1.biasF32[1280]
-
v.global.blk.0.ln2.weightF32[1280]
-
v.global.blk.0.ln2.biasF32[1280]
-
v.blk.1.attn_q.weightF16[1280 1280]
-
v.blk.1.attn_k.weightF16[1280 1280]
-
v.blk.1.attn_v.weightF16[1280 1280]
-
v.blk.1.attn_out.weightF16[1280 1280]
-
v.blk.1.ffn_down.weightF16[1280 5120]
-
v.blk.1.ffn_down.biasF32[5120]
-
v.blk.1.ffn_up.weightF16[5120 1280]
-
v.blk.1.ffn_up.biasF32[1280]
-
v.blk.1.ln1.weightF32[1280]
-
v.blk.1.ln1.biasF32[1280]
-
v.blk.1.ln2.weightF32[1280]
-
v.blk.1.ln2.biasF32[1280]
-
v.global.blk.1.attn_gateF32[1]
-
v.global.blk.1.ffn_gateF32[1]
-
v.global.blk.1.attn_q.weightF16[1280 1280]
-
v.global.blk.1.attn_k.weightF16[1280 1280]
-
v.global.blk.1.attn_v.weightF16[1280 1280]
-
v.global.blk.1.attn_out.weightF16[1280 1280]
-
v.global.blk.1.ffn_down.weightF16[1280 5120]
-
v.global.blk.1.ffn_down.biasF32[5120]
-
v.global.blk.1.ffn_up.weightF16[5120 1280]
-
v.global.blk.1.ffn_up.biasF32[1280]
-
v.global.blk.1.ln1.weightF32[1280]
-
v.global.blk.1.ln1.biasF32[1280]
-
v.global.blk.1.ln2.weightF32[1280]
-
v.global.blk.1.ln2.biasF32[1280]
-
v.blk.2.attn_q.weightF16[1280 1280]
-
v.blk.2.attn_k.weightF16[1280 1280]
-
v.blk.2.attn_v.weightF16[1280 1280]
-
v.blk.2.attn_out.weightF16[1280 1280]
-
v.blk.2.ffn_down.weightF16[1280 5120]
-
v.blk.2.ffn_down.biasF32[5120]
-
v.blk.2.ffn_up.weightF16[5120 1280]
-
v.blk.2.ffn_up.biasF32[1280]
-
v.blk.2.ln1.weightF32[1280]
-
v.blk.2.ln1.biasF32[1280]
-
v.blk.2.ln2.weightF32[1280]
-
v.blk.2.ln2.biasF32[1280]
-
v.global.blk.2.attn_gateF32[1]
-
v.global.blk.2.ffn_gateF32[1]
-
v.global.blk.2.attn_q.weightF16[1280 1280]
-
v.global.blk.2.attn_k.weightF16[1280 1280]
-
v.global.blk.2.attn_v.weightF16[1280 1280]
-
v.global.blk.2.attn_out.weightF16[1280 1280]
-
v.global.blk.2.ffn_down.weightF16[1280 5120]
-
v.global.blk.2.ffn_down.biasF32[5120]
-
v.global.blk.2.ffn_up.weightF16[5120 1280]
-
v.global.blk.2.ffn_up.biasF32[1280]
-
v.global.blk.2.ln1.weightF32[1280]
-
v.global.blk.2.ln1.biasF32[1280]
-
v.global.blk.2.ln2.weightF32[1280]
-
v.global.blk.2.ln2.biasF32[1280]
-
v.blk.3.attn_q.weightF16[1280 1280]
-
v.blk.3.attn_k.weightF16[1280 1280]
-
v.blk.3.attn_v.weightF16[1280 1280]
-
v.blk.3.attn_out.weightF16[1280 1280]
-
v.blk.3.ffn_down.weightF16[1280 5120]
-
v.blk.3.ffn_down.biasF32[5120]
-
v.blk.3.ffn_up.weightF16[5120 1280]
-
v.blk.3.ffn_up.biasF32[1280]
-
v.blk.3.ln1.weightF32[1280]
-
v.blk.3.ln1.biasF32[1280]
-
v.blk.3.ln2.weightF32[1280]
-
v.blk.3.ln2.biasF32[1280]
-
v.global.blk.3.attn_gateF32[1]
-
v.global.blk.3.ffn_gateF32[1]
-
v.global.blk.3.attn_q.weightF16[1280 1280]
-
v.global.blk.3.attn_k.weightF16[1280 1280]
-
v.global.blk.3.attn_v.weightF16[1280 1280]
-
v.global.blk.3.attn_out.weightF16[1280 1280]
-
v.global.blk.3.ffn_down.weightF16[1280 5120]
-
v.global.blk.3.ffn_down.biasF32[5120]
-
v.global.blk.3.ffn_up.weightF16[5120 1280]
-
v.global.blk.3.ffn_up.biasF32[1280]
-
v.global.blk.3.ln1.weightF32[1280]
-
v.global.blk.3.ln1.biasF32[1280]
-
v.global.blk.3.ln2.weightF32[1280]
-
v.global.blk.3.ln2.biasF32[1280]
-
v.blk.4.attn_q.weightF16[1280 1280]
-
v.blk.4.attn_k.weightF16[1280 1280]
-
v.blk.4.attn_v.weightF16[1280 1280]
-
v.blk.4.attn_out.weightF16[1280 1280]
-
v.blk.4.ffn_down.weightF16[1280 5120]
-
v.blk.4.ffn_down.biasF32[5120]
-
v.blk.4.ffn_up.weightF16[5120 1280]
-
v.blk.4.ffn_up.biasF32[1280]
-
v.blk.4.ln1.weightF32[1280]
-
v.blk.4.ln1.biasF32[1280]
-
v.blk.4.ln2.weightF32[1280]
-
v.blk.4.ln2.biasF32[1280]
-
v.global.blk.4.attn_gateF32[1]
-
v.global.blk.4.ffn_gateF32[1]
-
v.global.blk.4.attn_q.weightF16[1280 1280]
-
v.global.blk.4.attn_k.weightF16[1280 1280]
-
v.global.blk.4.attn_v.weightF16[1280 1280]
-
v.global.blk.4.attn_out.weightF16[1280 1280]
-
v.global.blk.4.ffn_down.weightF16[1280 5120]
-
v.global.blk.4.ffn_down.biasF32[5120]
-
v.global.blk.4.ffn_up.weightF16[5120 1280]
-
v.global.blk.4.ffn_up.biasF32[1280]
-
v.global.blk.4.ln1.weightF32[1280]
-
v.global.blk.4.ln1.biasF32[1280]
-
v.global.blk.4.ln2.weightF32[1280]
-
v.global.blk.4.ln2.biasF32[1280]
-
v.blk.5.attn_q.weightF16[1280 1280]
-
v.blk.5.attn_k.weightF16[1280 1280]
-
v.blk.5.attn_v.weightF16[1280 1280]
-
v.blk.5.attn_out.weightF16[1280 1280]
-
v.blk.5.ffn_down.weightF16[1280 5120]
-
v.blk.5.ffn_down.biasF32[5120]
-
v.blk.5.ffn_up.weightF16[5120 1280]
-
v.blk.5.ffn_up.biasF32[1280]
-
v.blk.5.ln1.weightF32[1280]
-
v.blk.5.ln1.biasF32[1280]
-
v.blk.5.ln2.weightF32[1280]
-
v.blk.5.ln2.biasF32[1280]
-
v.global.blk.5.attn_gateF32[1]
-
v.global.blk.5.ffn_gateF32[1]
-
v.global.blk.5.attn_q.weightF16[1280 1280]
-
v.global.blk.5.attn_k.weightF16[1280 1280]
-
v.global.blk.5.attn_v.weightF16[1280 1280]
-
v.global.blk.5.attn_out.weightF16[1280 1280]
-
v.global.blk.5.ffn_down.weightF16[1280 5120]
-
v.global.blk.5.ffn_down.biasF32[5120]
-
v.global.blk.5.ffn_up.weightF16[5120 1280]
-
v.global.blk.5.ffn_up.biasF32[1280]
-
v.global.blk.5.ln1.weightF32[1280]
-
v.global.blk.5.ln1.biasF32[1280]
-
v.global.blk.5.ln2.weightF32[1280]
-
v.global.blk.5.ln2.biasF32[1280]
-
v.blk.6.attn_q.weightF16[1280 1280]
-
v.blk.6.attn_k.weightF16[1280 1280]
-
v.blk.6.attn_v.weightF16[1280 1280]
-
v.blk.6.attn_out.weightF16[1280 1280]
-
v.blk.6.ffn_down.weightF16[1280 5120]
-
v.blk.6.ffn_down.biasF32[5120]
-
v.blk.6.ffn_up.weightF16[5120 1280]
-
v.blk.6.ffn_up.biasF32[1280]
-
v.blk.6.ln1.weightF32[1280]
-
v.blk.6.ln1.biasF32[1280]
-
v.blk.6.ln2.weightF32[1280]
-
v.blk.6.ln2.biasF32[1280]
-
v.global.blk.6.attn_gateF32[1]
-
v.global.blk.6.ffn_gateF32[1]
-
v.global.blk.6.attn_q.weightF16[1280 1280]
-
v.global.blk.6.attn_k.weightF16[1280 1280]
-
v.global.blk.6.attn_v.weightF16[1280 1280]
-
v.global.blk.6.attn_out.weightF16[1280 1280]
-
v.global.blk.6.ffn_down.weightF16[1280 5120]
-
v.global.blk.6.ffn_down.biasF32[5120]
-
v.global.blk.6.ffn_up.weightF16[5120 1280]
-
v.global.blk.6.ffn_up.biasF32[1280]
-
v.global.blk.6.ln1.weightF32[1280]
-
v.global.blk.6.ln1.biasF32[1280]
-
v.global.blk.6.ln2.weightF32[1280]
-
v.global.blk.6.ln2.biasF32[1280]
-
v.blk.7.attn_q.weightF16[1280 1280]
-
v.blk.7.attn_k.weightF16[1280 1280]
-
v.blk.7.attn_v.weightF16[1280 1280]
-
v.blk.7.attn_out.weightF16[1280 1280]
-
v.blk.7.ffn_down.weightF16[1280 5120]
-
v.blk.7.ffn_down.biasF32[5120]
-
v.blk.7.ffn_up.weightF16[5120 1280]
-
v.blk.7.ffn_up.biasF32[1280]
-
v.blk.7.ln1.weightF32[1280]
-
v.blk.7.ln1.biasF32[1280]
-
v.blk.7.ln2.weightF32[1280]
-
v.blk.7.ln2.biasF32[1280]
-
v.global.blk.7.attn_gateF32[1]
-
v.global.blk.7.ffn_gateF32[1]
-
v.global.blk.7.attn_q.weightF16[1280 1280]
-
v.global.blk.7.attn_k.weightF16[1280 1280]
-
v.global.blk.7.attn_v.weightF16[1280 1280]
-
v.global.blk.7.attn_out.weightF16[1280 1280]
-
v.global.blk.7.ffn_down.weightF16[1280 5120]
-
v.global.blk.7.ffn_down.biasF32[5120]
-
v.global.blk.7.ffn_up.weightF16[5120 1280]
-
v.global.blk.7.ffn_up.biasF32[1280]
-
v.global.blk.7.ln1.weightF32[1280]
-
v.global.blk.7.ln1.biasF32[1280]
-
v.global.blk.7.ln2.weightF32[1280]
-
v.global.blk.7.ln2.biasF32[1280]
-
v.blk.8.attn_q.weightF16[1280 1280]
-
v.blk.8.attn_k.weightF16[1280 1280]
-
v.blk.8.attn_v.weightF16[1280 1280]
-
v.blk.8.attn_out.weightF16[1280 1280]
-
v.blk.8.ffn_down.weightF16[1280 5120]
-
v.blk.8.ffn_down.biasF32[5120]
-
v.blk.8.ffn_up.weightF16[5120 1280]
-
v.blk.8.ffn_up.biasF32[1280]
-
v.blk.8.ln1.weightF32[1280]
-
v.blk.8.ln1.biasF32[1280]
-
v.blk.8.ln2.weightF32[1280]
-
v.blk.8.ln2.biasF32[1280]
-
v.blk.9.attn_q.weightF16[1280 1280]
-
v.blk.9.attn_k.weightF16[1280 1280]
-
v.blk.9.attn_v.weightF16[1280 1280]
-
v.blk.9.attn_out.weightF16[1280 1280]
-
v.blk.9.ffn_down.weightF16[1280 5120]
-
v.blk.9.ffn_down.biasF32[5120]
-
v.blk.9.ffn_up.weightF16[5120 1280]
-
v.blk.9.ffn_up.biasF32[1280]
-
v.blk.9.ln1.weightF32[1280]
-
v.blk.9.ln1.biasF32[1280]
-
v.blk.9.ln2.weightF32[1280]
-
v.blk.9.ln2.biasF32[1280]
-
v.blk.10.attn_q.weightF16[1280 1280]
-
v.blk.10.attn_k.weightF16[1280 1280]
-
v.blk.10.attn_v.weightF16[1280 1280]
-
v.blk.10.attn_out.weightF16[1280 1280]
-
v.blk.10.ffn_down.weightF16[1280 5120]
-
v.blk.10.ffn_down.biasF32[5120]
-
v.blk.10.ffn_up.weightF16[5120 1280]
-
v.blk.10.ffn_up.biasF32[1280]
-
v.blk.10.ln1.weightF32[1280]
-
v.blk.10.ln1.biasF32[1280]
-
v.blk.10.ln2.weightF32[1280]
-
v.blk.10.ln2.biasF32[1280]
-
v.blk.11.attn_q.weightF16[1280 1280]
-
v.blk.11.attn_k.weightF16[1280 1280]
-
v.blk.11.attn_v.weightF16[1280 1280]
-
v.blk.11.attn_out.weightF16[1280 1280]
-
v.blk.11.ffn_down.weightF16[1280 5120]
-
v.blk.11.ffn_down.biasF32[5120]
-
v.blk.11.ffn_up.weightF16[5120 1280]
-
v.blk.11.ffn_up.biasF32[1280]
-
v.blk.11.ln1.weightF32[1280]
-
v.blk.11.ln1.biasF32[1280]
-
v.blk.11.ln2.weightF32[1280]
-
v.blk.11.ln2.biasF32[1280]
-
v.blk.12.attn_q.weightF16[1280 1280]
-
v.blk.12.attn_k.weightF16[1280 1280]
-
v.blk.12.attn_v.weightF16[1280 1280]
-
v.blk.12.attn_out.weightF16[1280 1280]
-
v.blk.12.ffn_down.weightF16[1280 5120]
-
v.blk.12.ffn_down.biasF32[5120]
-
v.blk.12.ffn_up.weightF16[5120 1280]
-
v.blk.12.ffn_up.biasF32[1280]
-
v.blk.12.ln1.weightF32[1280]
-
v.blk.12.ln1.biasF32[1280]
-
v.blk.12.ln2.weightF32[1280]
-
v.blk.12.ln2.biasF32[1280]
-
v.blk.13.attn_q.weightF16[1280 1280]
-
v.blk.13.attn_k.weightF16[1280 1280]
-
v.blk.13.attn_v.weightF16[1280 1280]
-
v.blk.13.attn_out.weightF16[1280 1280]
-
v.blk.13.ffn_down.weightF16[1280 5120]
-
v.blk.13.ffn_down.biasF32[5120]
-
v.blk.13.ffn_up.weightF16[5120 1280]
-
v.blk.13.ffn_up.biasF32[1280]
-
v.blk.13.ln1.weightF32[1280]
-
v.blk.13.ln1.biasF32[1280]
-
v.blk.13.ln2.weightF32[1280]
-
v.blk.13.ln2.biasF32[1280]
-
v.blk.14.attn_q.weightF16[1280 1280]
-
v.blk.14.attn_k.weightF16[1280 1280]
-
v.blk.14.attn_v.weightF16[1280 1280]
-
v.blk.14.attn_out.weightF16[1280 1280]
-
v.blk.14.ffn_down.weightF16[1280 5120]
-
v.blk.14.ffn_down.biasF32[5120]
-
v.blk.14.ffn_up.weightF16[5120 1280]
-
v.blk.14.ffn_up.biasF32[1280]
-
v.blk.14.ln1.weightF32[1280]
-
v.blk.14.ln1.biasF32[1280]
-
v.blk.14.ln2.weightF32[1280]
-
v.blk.14.ln2.biasF32[1280]
-
v.blk.15.attn_q.weightF16[1280 1280]
-
v.blk.15.attn_k.weightF16[1280 1280]
-
v.blk.15.attn_v.weightF16[1280 1280]
-
v.blk.15.attn_out.weightF16[1280 1280]
-
v.blk.15.ffn_down.weightF16[1280 5120]
-
v.blk.15.ffn_down.biasF32[5120]
-
v.blk.15.ffn_up.weightF16[5120 1280]
-
v.blk.15.ffn_up.biasF32[1280]
-
v.blk.15.ln1.weightF32[1280]
-
v.blk.15.ln1.biasF32[1280]
-
v.blk.15.ln2.weightF32[1280]
-
v.blk.15.ln2.biasF32[1280]
-
v.blk.16.attn_q.weightF16[1280 1280]
-
v.blk.16.attn_k.weightF16[1280 1280]
-
v.blk.16.attn_v.weightF16[1280 1280]
-
v.blk.16.attn_out.weightF16[1280 1280]
-
v.blk.16.ffn_down.weightF16[1280 5120]
-
v.blk.16.ffn_down.biasF32[5120]
-
v.blk.16.ffn_up.weightF16[5120 1280]
-
v.blk.16.ffn_up.biasF32[1280]
-
v.blk.16.ln1.weightF32[1280]
-
v.blk.16.ln1.biasF32[1280]
-
v.blk.16.ln2.weightF32[1280]
-
v.blk.16.ln2.biasF32[1280]
-
v.blk.17.attn_q.weightF16[1280 1280]
-
v.blk.17.attn_k.weightF16[1280 1280]
-
v.blk.17.attn_v.weightF16[1280 1280]
-
v.blk.17.attn_out.weightF16[1280 1280]
-
v.blk.17.ffn_down.weightF16[1280 5120]
-
v.blk.17.ffn_down.biasF32[5120]
-
v.blk.17.ffn_up.weightF16[5120 1280]
-
v.blk.17.ffn_up.biasF32[1280]
-
v.blk.17.ln1.weightF32[1280]
-
v.blk.17.ln1.biasF32[1280]
-
v.blk.17.ln2.weightF32[1280]
-
v.blk.17.ln2.biasF32[1280]
-
v.blk.18.attn_q.weightF16[1280 1280]
-
v.blk.18.attn_k.weightF16[1280 1280]
-
v.blk.18.attn_v.weightF16[1280 1280]
-
v.blk.18.attn_out.weightF16[1280 1280]
-
v.blk.18.ffn_down.weightF16[1280 5120]
-
v.blk.18.ffn_down.biasF32[5120]
-
v.blk.18.ffn_up.weightF16[5120 1280]
-
v.blk.18.ffn_up.biasF32[1280]
-
v.blk.18.ln1.weightF32[1280]
-
v.blk.18.ln1.biasF32[1280]
-
v.blk.18.ln2.weightF32[1280]
-
v.blk.18.ln2.biasF32[1280]
-
v.blk.19.attn_q.weightF16[1280 1280]
-
v.blk.19.attn_k.weightF16[1280 1280]
-
v.blk.19.attn_v.weightF16[1280 1280]
-
v.blk.19.attn_out.weightF16[1280 1280]
-
v.blk.19.ffn_down.weightF16[1280 5120]
-
v.blk.19.ffn_down.biasF32[5120]
-
v.blk.19.ffn_up.weightF16[5120 1280]
-
v.blk.19.ffn_up.biasF32[1280]
-
v.blk.19.ln1.weightF32[1280]
-
v.blk.19.ln1.biasF32[1280]
-
v.blk.19.ln2.weightF32[1280]
-
v.blk.19.ln2.biasF32[1280]
-
v.blk.20.attn_q.weightF16[1280 1280]
-
v.blk.20.attn_k.weightF16[1280 1280]
-
v.blk.20.attn_v.weightF16[1280 1280]
-
v.blk.20.attn_out.weightF16[1280 1280]
-
v.blk.20.ffn_down.weightF16[1280 5120]
-
v.blk.20.ffn_down.biasF32[5120]
-
v.blk.20.ffn_up.weightF16[5120 1280]
-
v.blk.20.ffn_up.biasF32[1280]
-
v.blk.20.ln1.weightF32[1280]
-
v.blk.20.ln1.biasF32[1280]
-
v.blk.20.ln2.weightF32[1280]
-
v.blk.20.ln2.biasF32[1280]
-
v.blk.21.attn_q.weightF16[1280 1280]
-
v.blk.21.attn_k.weightF16[1280 1280]
-
v.blk.21.attn_v.weightF16[1280 1280]
-
v.blk.21.attn_out.weightF16[1280 1280]
-
v.blk.21.ffn_down.weightF16[1280 5120]
-
v.blk.21.ffn_down.biasF32[5120]
-
v.blk.21.ffn_up.weightF16[5120 1280]
-
v.blk.21.ffn_up.biasF32[1280]
-
v.blk.21.ln1.weightF32[1280]
-
v.blk.21.ln1.biasF32[1280]
-
v.blk.21.ln2.weightF32[1280]
-
v.blk.21.ln2.biasF32[1280]
-
v.blk.22.attn_q.weightF16[1280 1280]
-
v.blk.22.attn_k.weightF16[1280 1280]
-
v.blk.22.attn_v.weightF16[1280 1280]
-
v.blk.22.attn_out.weightF16[1280 1280]
-
v.blk.22.ffn_down.weightF16[1280 5120]
-
v.blk.22.ffn_down.biasF32[5120]
-
v.blk.22.ffn_up.weightF16[5120 1280]
-
v.blk.22.ffn_up.biasF32[1280]
-
v.blk.22.ln1.weightF32[1280]
-
v.blk.22.ln1.biasF32[1280]
-
v.blk.22.ln2.weightF32[1280]
-
v.blk.22.ln2.biasF32[1280]
-
v.blk.23.attn_q.weightF16[1280 1280]
-
v.blk.23.attn_k.weightF16[1280 1280]
-
v.blk.23.attn_v.weightF16[1280 1280]
-
v.blk.23.attn_out.weightF16[1280 1280]
-
v.blk.23.ffn_down.weightF16[1280 5120]
-
v.blk.23.ffn_down.biasF32[5120]
-
v.blk.23.ffn_up.weightF16[5120 1280]
-
v.blk.23.ffn_up.biasF32[1280]
-
v.blk.23.ln1.weightF32[1280]
-
v.blk.23.ln1.biasF32[1280]
-
v.blk.23.ln2.weightF32[1280]
-
v.blk.23.ln2.biasF32[1280]
-
v.blk.24.attn_q.weightF16[1280 1280]
-
v.blk.24.attn_k.weightF16[1280 1280]
-
v.blk.24.attn_v.weightF16[1280 1280]
-
v.blk.24.attn_out.weightF16[1280 1280]
-
v.blk.24.ffn_down.weightF16[1280 5120]
-
v.blk.24.ffn_down.biasF32[5120]
-
v.blk.24.ffn_up.weightF16[5120 1280]
-
v.blk.24.ffn_up.biasF32[1280]
-
v.blk.24.ln1.weightF32[1280]
-
v.blk.24.ln1.biasF32[1280]
-
v.blk.24.ln2.weightF32[1280]
-
v.blk.24.ln2.biasF32[1280]
-
v.blk.25.attn_q.weightF16[1280 1280]
-
v.blk.25.attn_k.weightF16[1280 1280]
-
v.blk.25.attn_v.weightF16[1280 1280]
-
v.blk.25.attn_out.weightF16[1280 1280]
-
v.blk.25.ffn_down.weightF16[1280 5120]
-
v.blk.25.ffn_down.biasF32[5120]
-
v.blk.25.ffn_up.weightF16[5120 1280]
-
v.blk.25.ffn_up.biasF32[1280]
-
v.blk.25.ln1.weightF32[1280]
-
v.blk.25.ln1.biasF32[1280]
-
v.blk.25.ln2.weightF32[1280]
-
v.blk.25.ln2.biasF32[1280]
-
v.blk.26.attn_q.weightF16[1280 1280]
-
v.blk.26.attn_k.weightF16[1280 1280]
-
v.blk.26.attn_v.weightF16[1280 1280]
-
v.blk.26.attn_out.weightF16[1280 1280]
-
v.blk.26.ffn_down.weightF16[1280 5120]
-
v.blk.26.ffn_down.biasF32[5120]
-
v.blk.26.ffn_up.weightF16[5120 1280]
-
v.blk.26.ffn_up.biasF32[1280]
-
v.blk.26.ln1.weightF32[1280]
-
v.blk.26.ln1.biasF32[1280]
-
v.blk.26.ln2.weightF32[1280]
-
v.blk.26.ln2.biasF32[1280]
-
v.blk.27.attn_q.weightF16[1280 1280]
-
v.blk.27.attn_k.weightF16[1280 1280]
-
v.blk.27.attn_v.weightF16[1280 1280]
-
v.blk.27.attn_out.weightF16[1280 1280]
-
v.blk.27.ffn_down.weightF16[1280 5120]
-
v.blk.27.ffn_down.biasF32[5120]
-
v.blk.27.ffn_up.weightF16[5120 1280]
-
v.blk.27.ffn_up.biasF32[1280]
-
v.blk.27.ln1.weightF32[1280]
-
v.blk.27.ln1.biasF32[1280]
-
v.blk.27.ln2.weightF32[1280]
-
v.blk.27.ln2.biasF32[1280]
-
v.blk.28.attn_q.weightF16[1280 1280]
-
v.blk.28.attn_k.weightF16[1280 1280]
-
v.blk.28.attn_v.weightF16[1280 1280]
-
v.blk.28.attn_out.weightF16[1280 1280]
-
v.blk.28.ffn_down.weightF16[1280 5120]
-
v.blk.28.ffn_down.biasF32[5120]
-
v.blk.28.ffn_up.weightF16[5120 1280]
-
v.blk.28.ffn_up.biasF32[1280]
-
v.blk.28.ln1.weightF32[1280]
-
v.blk.28.ln1.biasF32[1280]
-
v.blk.28.ln2.weightF32[1280]
-
v.blk.28.ln2.biasF32[1280]
-
v.blk.29.attn_q.weightF16[1280 1280]
-
v.blk.29.attn_k.weightF16[1280 1280]
-
v.blk.29.attn_v.weightF16[1280 1280]
-
v.blk.29.attn_out.weightF16[1280 1280]
-
v.blk.29.ffn_down.weightF16[1280 5120]
-
v.blk.29.ffn_down.biasF32[5120]
-
v.blk.29.ffn_up.weightF16[5120 1280]
-
v.blk.29.ffn_up.biasF32[1280]
-
v.blk.29.ln1.weightF32[1280]
-
v.blk.29.ln1.biasF32[1280]
-
v.blk.29.ln2.weightF32[1280]
-
v.blk.29.ln2.biasF32[1280]
-
v.blk.30.attn_q.weightF16[1280 1280]
-
v.blk.30.attn_k.weightF16[1280 1280]
-
v.blk.30.attn_v.weightF16[1280 1280]
-
v.blk.30.attn_out.weightF16[1280 1280]
-
v.blk.30.ffn_down.weightF16[1280 5120]
-
v.blk.30.ffn_down.biasF32[5120]
-
v.blk.30.ffn_up.weightF16[5120 1280]
-
v.blk.30.ffn_up.biasF32[1280]
-
v.blk.30.ln1.weightF32[1280]
-
v.blk.30.ln1.biasF32[1280]
-
v.blk.30.ln2.weightF32[1280]
-
v.blk.30.ln2.biasF32[1280]
-
v.blk.31.attn_q.weightF16[1280 1280]
-
v.blk.31.attn_k.weightF16[1280 1280]
-
v.blk.31.attn_v.weightF16[1280 1280]
-
v.blk.31.attn_out.weightF16[1280 1280]
-
v.blk.31.ffn_down.weightF16[1280 5120]
-
v.blk.31.ffn_down.biasF32[5120]
-
v.blk.31.ffn_up.weightF16[5120 1280]
-
v.blk.31.ffn_up.biasF32[1280]
-
v.blk.31.ln1.weightF32[1280]
-
v.blk.31.ln1.biasF32[1280]
-
v.blk.31.ln2.weightF32[1280]
-
v.blk.31.ln2.biasF32[1280]
-
mm.0.weightF16[7680 4096]
-
mm.0.biasF32[4096]
-
v.pre_ln.weightF32[1280]
-
v.pre_ln.biasF32[1280]
-
v.post_ln.weightF32[1280]
-
v.post_ln.biasF32[1280]
Metadata
Tensors
v.blk.0
v.blk.1
v.blk.2
v.blk.3
v.blk.4
v.blk.5
v.blk.6
v.blk.7
v.blk.8
v.blk.9
v.blk.10
v.blk.11
v.blk.12
v.blk.13
v.blk.14
v.blk.15
v.blk.16
v.blk.17
v.blk.18
v.blk.19
v.blk.20
v.blk.21
v.blk.22
v.blk.23
v.blk.24
v.blk.25
v.blk.26
v.blk.27
v.blk.28
v.blk.29
v.blk.30
v.blk.31