latest
21GB
Vision
74 Pulls Updated 2 weeks ago
8960a0a84f08 · 1.7GB
-
general.architectureclip
-
general.file_typeF16
-
clip.has_llava_projectortrue
-
clip.has_text_encoderfalse
-
clip.has_vision_encodertrue
-
clip.projector_typemlp
-
clip.use_gelutrue
-
clip.vision.attention.head_count16
-
clip.vision.attention.layer_norm_epsilon1e-05
-
clip.vision.block_count32
-
clip.vision.embedding_length1280
-
clip.vision.feed_forward_length5120
-
clip.vision.image_mean0.48145467
-
clip.vision.image_size560
-
clip.vision.image_std0.26862955
-
clip.vision.patch_size14
-
clip.vision.projection_dim4096
-
NameTypeShape
-
v.class_embdF32[1280 1 4]
-
v.patch_embd.weightF16[14 14 3 1280]
-
v.tile_position_embd.gateF32[1]
-
v.position_embd.gateF32[1]
-
v.position_embd.weightF16[1280 1601]
-
v.tile_position_embd.weightF32[8197120]
-
v.pre_tile_position_embd.gateF32[1]
-
v.pre_tile_position_embd.weightF32[5120]
-
v.post_tile_position_embd.gateF32[1]
-
v.post_tile_position_embd.weightF32[5120]
-
v.blk.0.attn_q.weightF16[1280 1280]
-
v.blk.0.attn_k.weightF16[1280 1280]
-
v.blk.0.attn_v.weightF16[1280 1280]
-
v.blk.0.attn_out.weightF16[1280 1280]
-
v.blk.0.ffn_down.weightF16[1280 5120]
-
v.blk.0.ffn_down.biasF32[5120]
-
v.blk.0.ffn_up.weightF16[5120 1280]
-
v.blk.0.ffn_up.biasF32[1280]
-
v.blk.0.ln1.weightF32[1280]
-
v.blk.0.ln1.biasF32[1280]
-
v.blk.0.ln2.weightF32[1280]
-
v.blk.0.ln2.biasF32[1280]
-
v.global.blk.0.attn_gateF32[1]
-
v.global.blk.0.ffn_gateF32[1]
-
v.global.blk.0.attn_q.weightF16[1280 1280]
-
v.global.blk.0.attn_k.weightF16[1280 1280]
-
v.global.blk.0.attn_v.weightF16[1280 1280]
-
v.global.blk.0.attn_out.weightF16[1280 1280]
-
v.global.blk.0.ffn_down.weightF16[1280 5120]
-
v.global.blk.0.ffn_down.biasF32[5120]
-
v.global.blk.0.ffn_up.weightF16[5120 1280]
-
v.global.blk.0.ffn_up.biasF32[1280]
-
v.global.blk.0.ln1.weightF32[1280]
-
v.global.blk.0.ln1.biasF32[1280]
-
v.global.blk.0.ln2.weightF32[1280]
-
v.global.blk.0.ln2.biasF32[1280]
-
v.blk.1.attn_q.weightF16[1280 1280]
-
v.blk.1.attn_k.weightF16[1280 1280]
-
v.blk.1.attn_v.weightF16[1280 1280]
-
v.blk.1.attn_out.weightF16[1280 1280]
-
v.blk.1.ffn_down.weightF16[1280 5120]
-
v.blk.1.ffn_down.biasF32[5120]
-
v.blk.1.ffn_up.weightF16[5120 1280]
-
v.blk.1.ffn_up.biasF32[1280]
-
v.blk.1.ln1.weightF32[1280]
-
v.blk.1.ln1.biasF32[1280]
-
v.blk.1.ln2.weightF32[1280]
-
v.blk.1.ln2.biasF32[1280]
-
v.global.blk.1.attn_gateF32[1]
-
v.global.blk.1.ffn_gateF32[1]
-
v.global.blk.1.attn_q.weightF16[1280 1280]
-
v.global.blk.1.attn_k.weightF16[1280 1280]
-
v.global.blk.1.attn_v.weightF16[1280 1280]
-
v.global.blk.1.attn_out.weightF16[1280 1280]
-
v.global.blk.1.ffn_down.weightF16[1280 5120]
-
v.global.blk.1.ffn_down.biasF32[5120]
-
v.global.blk.1.ffn_up.weightF16[5120 1280]
-
v.global.blk.1.ffn_up.biasF32[1280]
-
v.global.blk.1.ln1.weightF32[1280]
-
v.global.blk.1.ln1.biasF32[1280]
-
v.global.blk.1.ln2.weightF32[1280]
-
v.global.blk.1.ln2.biasF32[1280]
-
v.blk.2.attn_q.weightF16[1280 1280]
-
v.blk.2.attn_k.weightF16[1280 1280]
-
v.blk.2.attn_v.weightF16[1280 1280]
-
v.blk.2.attn_out.weightF16[1280 1280]
-
v.blk.2.ffn_down.weightF16[1280 5120]
-
v.blk.2.ffn_down.biasF32[5120]
-
v.blk.2.ffn_up.weightF16[5120 1280]
-
v.blk.2.ffn_up.biasF32[1280]
-
v.blk.2.ln1.weightF32[1280]
-
v.blk.2.ln1.biasF32[1280]
-
v.blk.2.ln2.weightF32[1280]
-
v.blk.2.ln2.biasF32[1280]
-
v.global.blk.2.attn_gateF32[1]
-
v.global.blk.2.ffn_gateF32[1]
-
v.global.blk.2.attn_q.weightF16[1280 1280]
-
v.global.blk.2.attn_k.weightF16[1280 1280]
-
v.global.blk.2.attn_v.weightF16[1280 1280]
-
v.global.blk.2.attn_out.weightF16[1280 1280]
-
v.global.blk.2.ffn_down.weightF16[1280 5120]
-
v.global.blk.2.ffn_down.biasF32[5120]
-
v.global.blk.2.ffn_up.weightF16[5120 1280]
-
v.global.blk.2.ffn_up.biasF32[1280]
-
v.global.blk.2.ln1.weightF32[1280]
-
v.global.blk.2.ln1.biasF32[1280]
-
v.global.blk.2.ln2.weightF32[1280]
-
v.global.blk.2.ln2.biasF32[1280]
-
v.blk.3.attn_q.weightF16[1280 1280]
-
v.blk.3.attn_k.weightF16[1280 1280]
-
v.blk.3.attn_v.weightF16[1280 1280]
-
v.blk.3.attn_out.weightF16[1280 1280]
-
v.blk.3.ffn_down.weightF16[1280 5120]
-
v.blk.3.ffn_down.biasF32[5120]
-
v.blk.3.ffn_up.weightF16[5120 1280]
-
v.blk.3.ffn_up.biasF32[1280]
-
v.blk.3.ln1.weightF32[1280]
-
v.blk.3.ln1.biasF32[1280]
-
v.blk.3.ln2.weightF32[1280]
-
v.blk.3.ln2.biasF32[1280]
-
v.global.blk.3.attn_gateF32[1]
-
v.global.blk.3.ffn_gateF32[1]
-
v.global.blk.3.attn_q.weightF16[1280 1280]
-
v.global.blk.3.attn_k.weightF16[1280 1280]
-
v.global.blk.3.attn_v.weightF16[1280 1280]
-
v.global.blk.3.attn_out.weightF16[1280 1280]
-
v.global.blk.3.ffn_down.weightF16[1280 5120]
-
v.global.blk.3.ffn_down.biasF32[5120]
-
v.global.blk.3.ffn_up.weightF16[5120 1280]
-
v.global.blk.3.ffn_up.biasF32[1280]
-
v.global.blk.3.ln1.weightF32[1280]
-
v.global.blk.3.ln1.biasF32[1280]
-
v.global.blk.3.ln2.weightF32[1280]
-
v.global.blk.3.ln2.biasF32[1280]
-
v.blk.4.attn_q.weightF16[1280 1280]
-
v.blk.4.attn_k.weightF16[1280 1280]
-
v.blk.4.attn_v.weightF16[1280 1280]
-
v.blk.4.attn_out.weightF16[1280 1280]
-
v.blk.4.ffn_down.weightF16[1280 5120]
-
v.blk.4.ffn_down.biasF32[5120]
-
v.blk.4.ffn_up.weightF16[5120 1280]
-
v.blk.4.ffn_up.biasF32[1280]
-
v.blk.4.ln1.weightF32[1280]
-
v.blk.4.ln1.biasF32[1280]
-
v.blk.4.ln2.weightF32[1280]
-
v.blk.4.ln2.biasF32[1280]
-
v.global.blk.4.attn_gateF32[1]
-
v.global.blk.4.ffn_gateF32[1]
-
v.global.blk.4.attn_q.weightF16[1280 1280]
-
v.global.blk.4.attn_k.weightF16[1280 1280]
-
v.global.blk.4.attn_v.weightF16[1280 1280]
-
v.global.blk.4.attn_out.weightF16[1280 1280]
-
v.global.blk.4.ffn_down.weightF16[1280 5120]
-
v.global.blk.4.ffn_down.biasF32[5120]
-
v.global.blk.4.ffn_up.weightF16[5120 1280]
-
v.global.blk.4.ffn_up.biasF32[1280]
-
v.global.blk.4.ln1.weightF32[1280]
-
v.global.blk.4.ln1.biasF32[1280]
-
v.global.blk.4.ln2.weightF32[1280]
-
v.global.blk.4.ln2.biasF32[1280]
-
v.blk.5.attn_q.weightF16[1280 1280]
-
v.blk.5.attn_k.weightF16[1280 1280]
-
v.blk.5.attn_v.weightF16[1280 1280]
-
v.blk.5.attn_out.weightF16[1280 1280]
-
v.blk.5.ffn_down.weightF16[1280 5120]
-
v.blk.5.ffn_down.biasF32[5120]
-
v.blk.5.ffn_up.weightF16[5120 1280]
-
v.blk.5.ffn_up.biasF32[1280]
-
v.blk.5.ln1.weightF32[1280]
-
v.blk.5.ln1.biasF32[1280]
-
v.blk.5.ln2.weightF32[1280]
-
v.blk.5.ln2.biasF32[1280]
-
v.global.blk.5.attn_gateF32[1]
-
v.global.blk.5.ffn_gateF32[1]
-
v.global.blk.5.attn_q.weightF16[1280 1280]
-
v.global.blk.5.attn_k.weightF16[1280 1280]
-
v.global.blk.5.attn_v.weightF16[1280 1280]
-
v.global.blk.5.attn_out.weightF16[1280 1280]
-
v.global.blk.5.ffn_down.weightF16[1280 5120]
-
v.global.blk.5.ffn_down.biasF32[5120]
-
v.global.blk.5.ffn_up.weightF16[5120 1280]
-
v.global.blk.5.ffn_up.biasF32[1280]
-
v.global.blk.5.ln1.weightF32[1280]
-
v.global.blk.5.ln1.biasF32[1280]
-
v.global.blk.5.ln2.weightF32[1280]
-
v.global.blk.5.ln2.biasF32[1280]
-
v.blk.6.attn_q.weightF16[1280 1280]
-
v.blk.6.attn_k.weightF16[1280 1280]
-
v.blk.6.attn_v.weightF16[1280 1280]
-
v.blk.6.attn_out.weightF16[1280 1280]
-
v.blk.6.ffn_down.weightF16[1280 5120]
-
v.blk.6.ffn_down.biasF32[5120]
-
v.blk.6.ffn_up.weightF16[5120 1280]
-
v.blk.6.ffn_up.biasF32[1280]
-
v.blk.6.ln1.weightF32[1280]
-
v.blk.6.ln1.biasF32[1280]
-
v.blk.6.ln2.weightF32[1280]
-
v.blk.6.ln2.biasF32[1280]
-
v.global.blk.6.attn_gateF32[1]
-
v.global.blk.6.ffn_gateF32[1]
-
v.global.blk.6.attn_q.weightF16[1280 1280]
-
v.global.blk.6.attn_k.weightF16[1280 1280]
-
v.global.blk.6.attn_v.weightF16[1280 1280]
-
v.global.blk.6.attn_out.weightF16[1280 1280]
-
v.global.blk.6.ffn_down.weightF16[1280 5120]
-
v.global.blk.6.ffn_down.biasF32[5120]
-
v.global.blk.6.ffn_up.weightF16[5120 1280]
-
v.global.blk.6.ffn_up.biasF32[1280]
-
v.global.blk.6.ln1.weightF32[1280]
-
v.global.blk.6.ln1.biasF32[1280]
-
v.global.blk.6.ln2.weightF32[1280]
-
v.global.blk.6.ln2.biasF32[1280]
-
v.blk.7.attn_q.weightF16[1280 1280]
-
v.blk.7.attn_k.weightF16[1280 1280]
-
v.blk.7.attn_v.weightF16[1280 1280]
-
v.blk.7.attn_out.weightF16[1280 1280]
-
v.blk.7.ffn_down.weightF16[1280 5120]
-
v.blk.7.ffn_down.biasF32[5120]
-
v.blk.7.ffn_up.weightF16[5120 1280]
-
v.blk.7.ffn_up.biasF32[1280]
-
v.blk.7.ln1.weightF32[1280]
-
v.blk.7.ln1.biasF32[1280]
-
v.blk.7.ln2.weightF32[1280]
-
v.blk.7.ln2.biasF32[1280]
-
v.global.blk.7.attn_gateF32[1]
-
v.global.blk.7.ffn_gateF32[1]
-
v.global.blk.7.attn_q.weightF16[1280 1280]
-
v.global.blk.7.attn_k.weightF16[1280 1280]
-
v.global.blk.7.attn_v.weightF16[1280 1280]
-
v.global.blk.7.attn_out.weightF16[1280 1280]
-
v.global.blk.7.ffn_down.weightF16[1280 5120]
-
v.global.blk.7.ffn_down.biasF32[5120]
-
v.global.blk.7.ffn_up.weightF16[5120 1280]
-
v.global.blk.7.ffn_up.biasF32[1280]
-
v.global.blk.7.ln1.weightF32[1280]
-
v.global.blk.7.ln1.biasF32[1280]
-
v.global.blk.7.ln2.weightF32[1280]
-
v.global.blk.7.ln2.biasF32[1280]
-
v.blk.8.attn_q.weightF16[1280 1280]
-
v.blk.8.attn_k.weightF16[1280 1280]
-
v.blk.8.attn_v.weightF16[1280 1280]
-
v.blk.8.attn_out.weightF16[1280 1280]
-
v.blk.8.ffn_down.weightF16[1280 5120]
-
v.blk.8.ffn_down.biasF32[5120]
-
v.blk.8.ffn_up.weightF16[5120 1280]
-
v.blk.8.ffn_up.biasF32[1280]
-
v.blk.8.ln1.weightF32[1280]
-
v.blk.8.ln1.biasF32[1280]
-
v.blk.8.ln2.weightF32[1280]
-
v.blk.8.ln2.biasF32[1280]
-
v.blk.9.attn_q.weightF16[1280 1280]
-
v.blk.9.attn_k.weightF16[1280 1280]
-
v.blk.9.attn_v.weightF16[1280 1280]
-
v.blk.9.attn_out.weightF16[1280 1280]
-
v.blk.9.ffn_down.weightF16[1280 5120]
-
v.blk.9.ffn_down.biasF32[5120]
-
v.blk.9.ffn_up.weightF16[5120 1280]
-
v.blk.9.ffn_up.biasF32[1280]
-
v.blk.9.ln1.weightF32[1280]
-
v.blk.9.ln1.biasF32[1280]
-
v.blk.9.ln2.weightF32[1280]
-
v.blk.9.ln2.biasF32[1280]
-
v.blk.10.attn_q.weightF16[1280 1280]
-
v.blk.10.attn_k.weightF16[1280 1280]
-
v.blk.10.attn_v.weightF16[1280 1280]
-
v.blk.10.attn_out.weightF16[1280 1280]
-
v.blk.10.ffn_down.weightF16[1280 5120]
-
v.blk.10.ffn_down.biasF32[5120]
-
v.blk.10.ffn_up.weightF16[5120 1280]
-
v.blk.10.ffn_up.biasF32[1280]
-
v.blk.10.ln1.weightF32[1280]
-
v.blk.10.ln1.biasF32[1280]
-
v.blk.10.ln2.weightF32[1280]
-
v.blk.10.ln2.biasF32[1280]
-
v.blk.11.attn_q.weightF16[1280 1280]
-
v.blk.11.attn_k.weightF16[1280 1280]
-
v.blk.11.attn_v.weightF16[1280 1280]
-
v.blk.11.attn_out.weightF16[1280 1280]
-
v.blk.11.ffn_down.weightF16[1280 5120]
-
v.blk.11.ffn_down.biasF32[5120]
-
v.blk.11.ffn_up.weightF16[5120 1280]
-
v.blk.11.ffn_up.biasF32[1280]
-
v.blk.11.ln1.weightF32[1280]
-
v.blk.11.ln1.biasF32[1280]
-
v.blk.11.ln2.weightF32[1280]
-
v.blk.11.ln2.biasF32[1280]
-
v.blk.12.attn_q.weightF16[1280 1280]
-
v.blk.12.attn_k.weightF16[1280 1280]
-
v.blk.12.attn_v.weightF16[1280 1280]
-
v.blk.12.attn_out.weightF16[1280 1280]
-
v.blk.12.ffn_down.weightF16[1280 5120]
-
v.blk.12.ffn_down.biasF32[5120]
-
v.blk.12.ffn_up.weightF16[5120 1280]
-
v.blk.12.ffn_up.biasF32[1280]
-
v.blk.12.ln1.weightF32[1280]
-
v.blk.12.ln1.biasF32[1280]
-
v.blk.12.ln2.weightF32[1280]
-
v.blk.12.ln2.biasF32[1280]
-
v.blk.13.attn_q.weightF16[1280 1280]
-
v.blk.13.attn_k.weightF16[1280 1280]
-
v.blk.13.attn_v.weightF16[1280 1280]
-
v.blk.13.attn_out.weightF16[1280 1280]
-
v.blk.13.ffn_down.weightF16[1280 5120]
-
v.blk.13.ffn_down.biasF32[5120]
-
v.blk.13.ffn_up.weightF16[5120 1280]
-
v.blk.13.ffn_up.biasF32[1280]
-
v.blk.13.ln1.weightF32[1280]
-
v.blk.13.ln1.biasF32[1280]
-
v.blk.13.ln2.weightF32[1280]
-
v.blk.13.ln2.biasF32[1280]
-
v.blk.14.attn_q.weightF16[1280 1280]
-
v.blk.14.attn_k.weightF16[1280 1280]
-
v.blk.14.attn_v.weightF16[1280 1280]
-
v.blk.14.attn_out.weightF16[1280 1280]
-
v.blk.14.ffn_down.weightF16[1280 5120]
-
v.blk.14.ffn_down.biasF32[5120]
-
v.blk.14.ffn_up.weightF16[5120 1280]
-
v.blk.14.ffn_up.biasF32[1280]
-
v.blk.14.ln1.weightF32[1280]
-
v.blk.14.ln1.biasF32[1280]
-
v.blk.14.ln2.weightF32[1280]
-
v.blk.14.ln2.biasF32[1280]
-
v.blk.15.attn_q.weightF16[1280 1280]
-
v.blk.15.attn_k.weightF16[1280 1280]
-
v.blk.15.attn_v.weightF16[1280 1280]
-
v.blk.15.attn_out.weightF16[1280 1280]
-
v.blk.15.ffn_down.weightF16[1280 5120]
-
v.blk.15.ffn_down.biasF32[5120]
-
v.blk.15.ffn_up.weightF16[5120 1280]
-
v.blk.15.ffn_up.biasF32[1280]
-
v.blk.15.ln1.weightF32[1280]
-
v.blk.15.ln1.biasF32[1280]
-
v.blk.15.ln2.weightF32[1280]
-
v.blk.15.ln2.biasF32[1280]
-
v.blk.16.attn_q.weightF16[1280 1280]
-
v.blk.16.attn_k.weightF16[1280 1280]
-
v.blk.16.attn_v.weightF16[1280 1280]
-
v.blk.16.attn_out.weightF16[1280 1280]
-
v.blk.16.ffn_down.weightF16[1280 5120]
-
v.blk.16.ffn_down.biasF32[5120]
-
v.blk.16.ffn_up.weightF16[5120 1280]
-
v.blk.16.ffn_up.biasF32[1280]
-
v.blk.16.ln1.weightF32[1280]
-
v.blk.16.ln1.biasF32[1280]
-
v.blk.16.ln2.weightF32[1280]
-
v.blk.16.ln2.biasF32[1280]
-
v.blk.17.attn_q.weightF16[1280 1280]
-
v.blk.17.attn_k.weightF16[1280 1280]
-
v.blk.17.attn_v.weightF16[1280 1280]
-
v.blk.17.attn_out.weightF16[1280 1280]
-
v.blk.17.ffn_down.weightF16[1280 5120]
-
v.blk.17.ffn_down.biasF32[5120]
-
v.blk.17.ffn_up.weightF16[5120 1280]
-
v.blk.17.ffn_up.biasF32[1280]
-
v.blk.17.ln1.weightF32[1280]
-
v.blk.17.ln1.biasF32[1280]
-
v.blk.17.ln2.weightF32[1280]
-
v.blk.17.ln2.biasF32[1280]
-
v.blk.18.attn_q.weightF16[1280 1280]
-
v.blk.18.attn_k.weightF16[1280 1280]
-
v.blk.18.attn_v.weightF16[1280 1280]
-
v.blk.18.attn_out.weightF16[1280 1280]
-
v.blk.18.ffn_down.weightF16[1280 5120]
-
v.blk.18.ffn_down.biasF32[5120]
-
v.blk.18.ffn_up.weightF16[5120 1280]
-
v.blk.18.ffn_up.biasF32[1280]
-
v.blk.18.ln1.weightF32[1280]
-
v.blk.18.ln1.biasF32[1280]
-
v.blk.18.ln2.weightF32[1280]
-
v.blk.18.ln2.biasF32[1280]
-
v.blk.19.attn_q.weightF16[1280 1280]
-
v.blk.19.attn_k.weightF16[1280 1280]
-
v.blk.19.attn_v.weightF16[1280 1280]
-
v.blk.19.attn_out.weightF16[1280 1280]
-
v.blk.19.ffn_down.weightF16[1280 5120]
-
v.blk.19.ffn_down.biasF32[5120]
-
v.blk.19.ffn_up.weightF16[5120 1280]
-
v.blk.19.ffn_up.biasF32[1280]
-
v.blk.19.ln1.weightF32[1280]
-
v.blk.19.ln1.biasF32[1280]
-
v.blk.19.ln2.weightF32[1280]
-
v.blk.19.ln2.biasF32[1280]
-
v.blk.20.attn_q.weightF16[1280 1280]
-
v.blk.20.attn_k.weightF16[1280 1280]
-
v.blk.20.attn_v.weightF16[1280 1280]
-
v.blk.20.attn_out.weightF16[1280 1280]
-
v.blk.20.ffn_down.weightF16[1280 5120]
-
v.blk.20.ffn_down.biasF32[5120]
-
v.blk.20.ffn_up.weightF16[5120 1280]
-
v.blk.20.ffn_up.biasF32[1280]
-
v.blk.20.ln1.weightF32[1280]
-
v.blk.20.ln1.biasF32[1280]
-
v.blk.20.ln2.weightF32[1280]
-
v.blk.20.ln2.biasF32[1280]
-
v.blk.21.attn_q.weightF16[1280 1280]
-
v.blk.21.attn_k.weightF16[1280 1280]
-
v.blk.21.attn_v.weightF16[1280 1280]
-
v.blk.21.attn_out.weightF16[1280 1280]
-
v.blk.21.ffn_down.weightF16[1280 5120]
-
v.blk.21.ffn_down.biasF32[5120]
-
v.blk.21.ffn_up.weightF16[5120 1280]
-
v.blk.21.ffn_up.biasF32[1280]
-
v.blk.21.ln1.weightF32[1280]
-
v.blk.21.ln1.biasF32[1280]
-
v.blk.21.ln2.weightF32[1280]
-
v.blk.21.ln2.biasF32[1280]
-
v.blk.22.attn_q.weightF16[1280 1280]
-
v.blk.22.attn_k.weightF16[1280 1280]
-
v.blk.22.attn_v.weightF16[1280 1280]
-
v.blk.22.attn_out.weightF16[1280 1280]
-
v.blk.22.ffn_down.weightF16[1280 5120]
-
v.blk.22.ffn_down.biasF32[5120]
-
v.blk.22.ffn_up.weightF16[5120 1280]
-
v.blk.22.ffn_up.biasF32[1280]
-
v.blk.22.ln1.weightF32[1280]
-
v.blk.22.ln1.biasF32[1280]
-
v.blk.22.ln2.weightF32[1280]
-
v.blk.22.ln2.biasF32[1280]
-
v.blk.23.attn_q.weightF16[1280 1280]
-
v.blk.23.attn_k.weightF16[1280 1280]
-
v.blk.23.attn_v.weightF16[1280 1280]
-
v.blk.23.attn_out.weightF16[1280 1280]
-
v.blk.23.ffn_down.weightF16[1280 5120]
-
v.blk.23.ffn_down.biasF32[5120]
-
v.blk.23.ffn_up.weightF16[5120 1280]
-
v.blk.23.ffn_up.biasF32[1280]
-
v.blk.23.ln1.weightF32[1280]
-
v.blk.23.ln1.biasF32[1280]
-
v.blk.23.ln2.weightF32[1280]
-
v.blk.23.ln2.biasF32[1280]
-
v.blk.24.attn_q.weightF16[1280 1280]
-
v.blk.24.attn_k.weightF16[1280 1280]
-
v.blk.24.attn_v.weightF16[1280 1280]
-
v.blk.24.attn_out.weightF16[1280 1280]
-
v.blk.24.ffn_down.weightF16[1280 5120]
-
v.blk.24.ffn_down.biasF32[5120]
-
v.blk.24.ffn_up.weightF16[5120 1280]
-
v.blk.24.ffn_up.biasF32[1280]
-
v.blk.24.ln1.weightF32[1280]
-
v.blk.24.ln1.biasF32[1280]
-
v.blk.24.ln2.weightF32[1280]
-
v.blk.24.ln2.biasF32[1280]
-
v.blk.25.attn_q.weightF16[1280 1280]
-
v.blk.25.attn_k.weightF16[1280 1280]
-
v.blk.25.attn_v.weightF16[1280 1280]
-
v.blk.25.attn_out.weightF16[1280 1280]
-
v.blk.25.ffn_down.weightF16[1280 5120]
-
v.blk.25.ffn_down.biasF32[5120]
-
v.blk.25.ffn_up.weightF16[5120 1280]
-
v.blk.25.ffn_up.biasF32[1280]
-
v.blk.25.ln1.weightF32[1280]
-
v.blk.25.ln1.biasF32[1280]
-
v.blk.25.ln2.weightF32[1280]
-
v.blk.25.ln2.biasF32[1280]
-
v.blk.26.attn_q.weightF16[1280 1280]
-
v.blk.26.attn_k.weightF16[1280 1280]
-
v.blk.26.attn_v.weightF16[1280 1280]
-
v.blk.26.attn_out.weightF16[1280 1280]
-
v.blk.26.ffn_down.weightF16[1280 5120]
-
v.blk.26.ffn_down.biasF32[5120]
-
v.blk.26.ffn_up.weightF16[5120 1280]
-
v.blk.26.ffn_up.biasF32[1280]
-
v.blk.26.ln1.weightF32[1280]
-
v.blk.26.ln1.biasF32[1280]
-
v.blk.26.ln2.weightF32[1280]
-
v.blk.26.ln2.biasF32[1280]
-
v.blk.27.attn_q.weightF16[1280 1280]
-
v.blk.27.attn_k.weightF16[1280 1280]
-
v.blk.27.attn_v.weightF16[1280 1280]
-
v.blk.27.attn_out.weightF16[1280 1280]
-
v.blk.27.ffn_down.weightF16[1280 5120]
-
v.blk.27.ffn_down.biasF32[5120]
-
v.blk.27.ffn_up.weightF16[5120 1280]
-
v.blk.27.ffn_up.biasF32[1280]
-
v.blk.27.ln1.weightF32[1280]
-
v.blk.27.ln1.biasF32[1280]
-
v.blk.27.ln2.weightF32[1280]
-
v.blk.27.ln2.biasF32[1280]
-
v.blk.28.attn_q.weightF16[1280 1280]
-
v.blk.28.attn_k.weightF16[1280 1280]
-
v.blk.28.attn_v.weightF16[1280 1280]
-
v.blk.28.attn_out.weightF16[1280 1280]
-
v.blk.28.ffn_down.weightF16[1280 5120]
-
v.blk.28.ffn_down.biasF32[5120]
-
v.blk.28.ffn_up.weightF16[5120 1280]
-
v.blk.28.ffn_up.biasF32[1280]
-
v.blk.28.ln1.weightF32[1280]
-
v.blk.28.ln1.biasF32[1280]
-
v.blk.28.ln2.weightF32[1280]
-
v.blk.28.ln2.biasF32[1280]
-
v.blk.29.attn_q.weightF16[1280 1280]
-
v.blk.29.attn_k.weightF16[1280 1280]
-
v.blk.29.attn_v.weightF16[1280 1280]
-
v.blk.29.attn_out.weightF16[1280 1280]
-
v.blk.29.ffn_down.weightF16[1280 5120]
-
v.blk.29.ffn_down.biasF32[5120]
-
v.blk.29.ffn_up.weightF16[5120 1280]
-
v.blk.29.ffn_up.biasF32[1280]
-
v.blk.29.ln1.weightF32[1280]
-
v.blk.29.ln1.biasF32[1280]
-
v.blk.29.ln2.weightF32[1280]
-
v.blk.29.ln2.biasF32[1280]
-
v.blk.30.attn_q.weightF16[1280 1280]
-
v.blk.30.attn_k.weightF16[1280 1280]
-
v.blk.30.attn_v.weightF16[1280 1280]
-
v.blk.30.attn_out.weightF16[1280 1280]
-
v.blk.30.ffn_down.weightF16[1280 5120]
-
v.blk.30.ffn_down.biasF32[5120]
-
v.blk.30.ffn_up.weightF16[5120 1280]
-
v.blk.30.ffn_up.biasF32[1280]
-
v.blk.30.ln1.weightF32[1280]
-
v.blk.30.ln1.biasF32[1280]
-
v.blk.30.ln2.weightF32[1280]
-
v.blk.30.ln2.biasF32[1280]
-
v.blk.31.attn_q.weightF16[1280 1280]
-
v.blk.31.attn_k.weightF16[1280 1280]
-
v.blk.31.attn_v.weightF16[1280 1280]
-
v.blk.31.attn_out.weightF16[1280 1280]
-
v.blk.31.ffn_down.weightF16[1280 5120]
-
v.blk.31.ffn_down.biasF32[5120]
-
v.blk.31.ffn_up.weightF16[5120 1280]
-
v.blk.31.ffn_up.biasF32[1280]
-
v.blk.31.ln1.weightF32[1280]
-
v.blk.31.ln1.biasF32[1280]
-
v.blk.31.ln2.weightF32[1280]
-
v.blk.31.ln2.biasF32[1280]
-
mm.0.weightF16[7680 4096]
-
mm.0.biasF32[4096]
-
v.pre_ln.weightF32[1280]
-
v.pre_ln.biasF32[1280]
-
v.post_ln.weightF32[1280]
-
v.post_ln.biasF32[1280]
Metadata
Tensors
v.blk.0
v.blk.1
v.blk.2
v.blk.3
v.blk.4
v.blk.5
v.blk.6
v.blk.7
v.blk.8
v.blk.9
v.blk.10
v.blk.11
v.blk.12
v.blk.13
v.blk.14
v.blk.15
v.blk.16
v.blk.17
v.blk.18
v.blk.19
v.blk.20
v.blk.21
v.blk.22
v.blk.23
v.blk.24
v.blk.25
v.blk.26
v.blk.27
v.blk.28
v.blk.29
v.blk.30
v.blk.31