Models
Docs
Pricing
Sign in
Download
Models
Download
Docs
Pricing
Sign in
HSR-DeepThink
/
nwe
:latest
598
Downloads
Updated
3 weeks ago
Image generator, more lightweight than the x/flux model; uses compression and is built using LoRA
Image generator, more lightweight than the x/flux model; uses compression and is built using LoRA
Cancel
nwe:latest
...
/
model
b8944e9fe0b6 · 1.6GB
Metadata
Tensor
Name
Type
Shape
alphas_cumprod
F16
F16
[1000]
cond_stage_model.transformer.text_model.embeddings.position_embedding.weight
Q4_0
Q4_0
[768, 77]
cond_stage_model.transformer.text_model.embeddings.token_embedding.weight
Q4_0
Q4_0
[768, 49408]
cond_stage_model.transformer.text_model.encoder.layers.0.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.0.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.0.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.0.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.1.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.1.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.1.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.1.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.2.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.2.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.2.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.2.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.3.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.3.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.3.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.3.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.4.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.4.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.4.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.4.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.5.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.5.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.5.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.5.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.6.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.6.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.6.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.6.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.7.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.7.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.7.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.7.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.8.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.8.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.8.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.8.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.9.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.9.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.9.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.9.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.10.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.10.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.10.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.10.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.11.layer_norm1.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.layer_norm1.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.layer_norm2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.layer_norm2.weight
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.mlp.fc1.bias
Q4_0
Q4_0
[3072]
cond_stage_model.transformer.text_model.encoder.layers.11.mlp.fc1.weight
Q4_0
Q4_0
[768, 3072]
cond_stage_model.transformer.text_model.encoder.layers.11.mlp.fc2.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.mlp.fc2.weight
Q4_0
Q4_0
[3072, 768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.k_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.k_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.out_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.out_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.q_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.q_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.v_proj.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.encoder.layers.11.self_attn.v_proj.weight
Q4_0
Q4_0
[768, 768]
cond_stage_model.transformer.text_model.final_layer_norm.bias
Q4_0
Q4_0
[768]
cond_stage_model.transformer.text_model.final_layer_norm.weight
Q4_0
Q4_0
[768]
first_stage_model.decoder.conv_in.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.conv_in.weight
F16
F16
[3, 3, 4, 512]
first_stage_model.decoder.conv_out.bias
F16
F16
[3]
first_stage_model.decoder.conv_out.weight
F16
F16
[3, 3, 128, 3]
first_stage_model.decoder.mid.attn_1.k.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.attn_1.k.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.decoder.mid.attn_1.norm.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.attn_1.norm.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.attn_1.proj_out.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.attn_1.proj_out.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.decoder.mid.attn_1.q.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.attn_1.q.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.decoder.mid.attn_1.v.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.attn_1.v.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.decoder.mid.block_1.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_1.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.mid.block_1.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_1.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.mid.block_1.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_1.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_1.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_1.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_2.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_2.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.mid.block_2.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_2.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.mid.block_2.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_2.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_2.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.mid.block_2.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.norm_out.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.norm_out.weight
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.0.conv1.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.0.conv1.weight
F16
F16
[3, 3, 256, 128]
first_stage_model.decoder.up.0.block.0.conv2.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.0.conv2.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.decoder.up.0.block.0.nin_shortcut.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.0.nin_shortcut.weight
F16
F16
[1, 1, 256, 128]
first_stage_model.decoder.up.0.block.0.norm1.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.0.block.0.norm1.weight
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.0.block.0.norm2.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.0.norm2.weight
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.1.conv1.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.1.conv1.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.decoder.up.0.block.1.conv2.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.1.conv2.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.decoder.up.0.block.1.norm1.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.1.norm1.weight
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.1.norm2.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.1.norm2.weight
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.2.conv1.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.2.conv1.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.decoder.up.0.block.2.conv2.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.2.conv2.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.decoder.up.0.block.2.norm1.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.2.norm1.weight
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.2.norm2.bias
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.0.block.2.norm2.weight
Q4_0
Q4_0
[128]
first_stage_model.decoder.up.1.block.0.conv1.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.0.conv1.weight
F16
F16
[3, 3, 512, 256]
first_stage_model.decoder.up.1.block.0.conv2.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.0.conv2.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.decoder.up.1.block.0.nin_shortcut.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.0.nin_shortcut.weight
F16
F16
[1, 1, 512, 256]
first_stage_model.decoder.up.1.block.0.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.1.block.0.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.1.block.0.norm2.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.0.norm2.weight
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.1.conv1.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.1.conv1.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.decoder.up.1.block.1.conv2.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.1.conv2.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.decoder.up.1.block.1.norm1.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.1.norm1.weight
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.1.norm2.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.1.norm2.weight
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.2.conv1.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.2.conv1.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.decoder.up.1.block.2.conv2.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.2.conv2.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.decoder.up.1.block.2.norm1.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.2.norm1.weight
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.2.norm2.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.block.2.norm2.weight
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.upsample.conv.bias
Q4_0
Q4_0
[256]
first_stage_model.decoder.up.1.upsample.conv.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.decoder.up.2.block.0.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.0.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.2.block.0.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.0.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.2.block.0.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.0.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.0.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.0.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.1.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.1.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.2.block.1.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.1.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.2.block.1.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.1.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.1.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.1.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.2.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.2.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.2.block.2.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.2.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.2.block.2.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.2.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.2.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.block.2.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.upsample.conv.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.2.upsample.conv.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.3.block.0.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.0.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.3.block.0.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.0.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.3.block.0.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.0.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.0.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.0.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.1.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.1.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.3.block.1.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.1.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.3.block.1.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.1.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.1.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.1.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.2.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.2.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.3.block.2.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.2.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.decoder.up.3.block.2.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.2.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.2.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.block.2.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.upsample.conv.bias
Q4_0
Q4_0
[512]
first_stage_model.decoder.up.3.upsample.conv.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.conv_in.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.conv_in.weight
F16
F16
[3, 3, 3, 128]
first_stage_model.encoder.conv_out.bias
F16
F16
[8]
first_stage_model.encoder.conv_out.weight
F16
F16
[3, 3, 512, 8]
first_stage_model.encoder.down.0.block.0.conv1.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.0.conv1.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.encoder.down.0.block.0.conv2.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.0.conv2.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.encoder.down.0.block.0.norm1.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.0.norm1.weight
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.0.norm2.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.0.norm2.weight
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.1.conv1.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.1.conv1.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.encoder.down.0.block.1.conv2.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.1.conv2.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.encoder.down.0.block.1.norm1.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.1.norm1.weight
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.1.norm2.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.block.1.norm2.weight
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.downsample.conv.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.0.downsample.conv.weight
F16
F16
[3, 3, 128, 128]
first_stage_model.encoder.down.1.block.0.conv1.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.0.conv1.weight
F16
F16
[3, 3, 128, 256]
first_stage_model.encoder.down.1.block.0.conv2.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.0.conv2.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.encoder.down.1.block.0.nin_shortcut.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.0.nin_shortcut.weight
F16
F16
[1, 1, 128, 256]
first_stage_model.encoder.down.1.block.0.norm1.bias
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.1.block.0.norm1.weight
Q4_0
Q4_0
[128]
first_stage_model.encoder.down.1.block.0.norm2.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.0.norm2.weight
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.1.conv1.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.1.conv1.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.encoder.down.1.block.1.conv2.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.1.conv2.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.encoder.down.1.block.1.norm1.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.1.norm1.weight
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.1.norm2.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.block.1.norm2.weight
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.downsample.conv.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.1.downsample.conv.weight
F16
F16
[3, 3, 256, 256]
first_stage_model.encoder.down.2.block.0.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.0.conv1.weight
F16
F16
[3, 3, 256, 512]
first_stage_model.encoder.down.2.block.0.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.0.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.2.block.0.nin_shortcut.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.0.nin_shortcut.weight
F16
F16
[1, 1, 256, 512]
first_stage_model.encoder.down.2.block.0.norm1.bias
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.2.block.0.norm1.weight
Q4_0
Q4_0
[256]
first_stage_model.encoder.down.2.block.0.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.0.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.1.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.1.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.2.block.1.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.1.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.2.block.1.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.1.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.1.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.block.1.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.downsample.conv.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.2.downsample.conv.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.3.block.0.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.0.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.3.block.0.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.0.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.3.block.0.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.0.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.0.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.0.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.1.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.1.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.3.block.1.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.1.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.down.3.block.1.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.1.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.1.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.down.3.block.1.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.attn_1.k.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.attn_1.k.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.encoder.mid.attn_1.norm.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.attn_1.norm.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.attn_1.proj_out.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.attn_1.proj_out.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.encoder.mid.attn_1.q.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.attn_1.q.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.encoder.mid.attn_1.v.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.attn_1.v.weight
F16
F16
[1, 1, 512, 512]
first_stage_model.encoder.mid.block_1.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_1.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.mid.block_1.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_1.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.mid.block_1.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_1.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_1.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_1.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_2.conv1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_2.conv1.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.mid.block_2.conv2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_2.conv2.weight
F16
F16
[3, 3, 512, 512]
first_stage_model.encoder.mid.block_2.norm1.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_2.norm1.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_2.norm2.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.mid.block_2.norm2.weight
Q4_0
Q4_0
[512]
first_stage_model.encoder.norm_out.bias
Q4_0
Q4_0
[512]
first_stage_model.encoder.norm_out.weight
Q4_0
Q4_0
[512]
first_stage_model.post_quant_conv.bias
F16
F16
[4]
first_stage_model.post_quant_conv.weight
F16
F16
[1, 1, 4, 4]
first_stage_model.quant_conv.bias
F16
F16
[8]
first_stage_model.quant_conv.weight
F16
F16
[1, 1, 8, 8]
model.diffusion_model.input_blocks.0.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.0.0.weight
F16
F16
[3, 3, 4, 320]
model.diffusion_model.input_blocks.1.0.emb_layers.1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.input_blocks.1.0.in_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.0.in_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.0.in_layers.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.0.in_layers.2.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.input_blocks.1.0.out_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.0.out_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.0.out_layers.3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.0.out_layers.3.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.input_blocks.1.1.norm.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.norm.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.proj_in.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.proj_in.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.input_blocks.1.1.proj_out.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.proj_out.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[320, 2560]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.1.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.emb_layers.1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.input_blocks.2.0.in_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.in_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.in_layers.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.in_layers.2.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.input_blocks.2.0.out_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.out_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.out_layers.3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.0.out_layers.3.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.input_blocks.2.1.norm.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.norm.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.proj_in.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.proj_in.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.input_blocks.2.1.proj_out.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.proj_out.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[320, 2560]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.2.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.3.0.op.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.3.0.op.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.input_blocks.4.0.emb_layers.1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 640]
model.diffusion_model.input_blocks.4.0.in_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.4.0.in_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.input_blocks.4.0.in_layers.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.0.in_layers.2.weight
F16
F16
[3, 3, 320, 640]
model.diffusion_model.input_blocks.4.0.out_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.0.out_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.0.out_layers.3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.0.out_layers.3.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.input_blocks.4.0.skip_connection.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.0.skip_connection.weight
F16
F16
[1, 1, 320, 640]
model.diffusion_model.input_blocks.4.1.norm.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.norm.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.proj_in.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.proj_in.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.input_blocks.4.1.proj_out.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.proj_out.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[5120]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[640, 5120]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[2560, 640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.4.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.emb_layers.1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 640]
model.diffusion_model.input_blocks.5.0.in_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.in_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.in_layers.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.in_layers.2.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.input_blocks.5.0.out_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.out_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.out_layers.3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.0.out_layers.3.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.input_blocks.5.1.norm.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.norm.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.proj_in.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.proj_in.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.input_blocks.5.1.proj_out.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.proj_out.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[5120]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[640, 5120]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[2560, 640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.5.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.6.0.op.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.6.0.op.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.input_blocks.7.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.7.0.in_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.7.0.in_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.input_blocks.7.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.0.in_layers.2.weight
F16
F16
[3, 3, 640, 1280]
model.diffusion_model.input_blocks.7.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.input_blocks.7.0.skip_connection.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.0.skip_connection.weight
F16
F16
[1, 1, 640, 1280]
model.diffusion_model.input_blocks.7.1.norm.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.norm.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.proj_in.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.proj_in.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.input_blocks.7.1.proj_out.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.proj_out.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[10240]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[1280, 10240]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[5120, 1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.7.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.8.0.in_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.in_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.in_layers.2.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.input_blocks.8.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.input_blocks.8.1.norm.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.norm.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.proj_in.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.proj_in.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.input_blocks.8.1.proj_out.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.proj_out.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[10240]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[1280, 10240]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[5120, 1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.8.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.9.0.op.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.9.0.op.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.input_blocks.10.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.10.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.10.0.in_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.10.0.in_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.10.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.10.0.in_layers.2.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.input_blocks.10.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.10.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.10.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.10.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.input_blocks.11.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.11.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.input_blocks.11.0.in_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.11.0.in_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.11.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.11.0.in_layers.2.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.input_blocks.11.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.11.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.11.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.input_blocks.11.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.middle_block.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.0.in_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.0.in_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.0.in_layers.2.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.middle_block.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.middle_block.1.norm.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.norm.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.proj_in.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.proj_in.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.middle_block.1.proj_out.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.proj_out.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[10240]
model.diffusion_model.middle_block.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[1280, 10240]
model.diffusion_model.middle_block.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[5120, 1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.middle_block.2.in_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.in_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.in_layers.2.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.middle_block.2.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.middle_block.2.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.out.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.out.2.bias
F16
F16
[4]
model.diffusion_model.out.2.weight
F16
F16
[3, 3, 320, 4]
model.diffusion_model.output_blocks.0.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.0.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.0.0.in_layers.0.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.0.0.in_layers.0.weight
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.0.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.0.0.in_layers.2.weight
F16
F16
[3, 3, 2560, 1280]
model.diffusion_model.output_blocks.0.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.0.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.0.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.0.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.0.0.skip_connection.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.0.0.skip_connection.weight
F16
F16
[1, 1, 2560, 1280]
model.diffusion_model.output_blocks.1.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.1.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.1.0.in_layers.0.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.1.0.in_layers.0.weight
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.1.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.1.0.in_layers.2.weight
F16
F16
[3, 3, 2560, 1280]
model.diffusion_model.output_blocks.1.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.1.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.1.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.1.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.1.0.skip_connection.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.1.0.skip_connection.weight
F16
F16
[1, 1, 2560, 1280]
model.diffusion_model.output_blocks.2.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.2.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.2.0.in_layers.0.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.2.0.in_layers.0.weight
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.2.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.2.0.in_layers.2.weight
F16
F16
[3, 3, 2560, 1280]
model.diffusion_model.output_blocks.2.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.2.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.2.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.2.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.2.0.skip_connection.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.2.0.skip_connection.weight
F16
F16
[1, 1, 2560, 1280]
model.diffusion_model.output_blocks.2.1.conv.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.2.1.conv.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.3.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.3.0.in_layers.0.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.3.0.in_layers.0.weight
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.3.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.0.in_layers.2.weight
F16
F16
[3, 3, 2560, 1280]
model.diffusion_model.output_blocks.3.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.3.0.skip_connection.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.0.skip_connection.weight
F16
F16
[1, 1, 2560, 1280]
model.diffusion_model.output_blocks.3.1.norm.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.norm.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.proj_in.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.proj_in.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.output_blocks.3.1.proj_out.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.proj_out.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[10240]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[1280, 10240]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[5120, 1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.3.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.4.0.in_layers.0.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.4.0.in_layers.0.weight
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.4.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.0.in_layers.2.weight
F16
F16
[3, 3, 2560, 1280]
model.diffusion_model.output_blocks.4.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.4.0.skip_connection.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.0.skip_connection.weight
F16
F16
[1, 1, 2560, 1280]
model.diffusion_model.output_blocks.4.1.norm.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.norm.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.proj_in.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.proj_in.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.output_blocks.4.1.proj_out.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.proj_out.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[10240]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[1280, 10240]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[5120, 1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.4.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.0.emb_layers.1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.5.0.in_layers.0.bias
Q4_0
Q4_0
[1920]
model.diffusion_model.output_blocks.5.0.in_layers.0.weight
Q4_0
Q4_0
[1920]
model.diffusion_model.output_blocks.5.0.in_layers.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.0.in_layers.2.weight
F16
F16
[3, 3, 1920, 1280]
model.diffusion_model.output_blocks.5.0.out_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.0.out_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.0.out_layers.3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.0.out_layers.3.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.5.0.skip_connection.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.0.skip_connection.weight
F16
F16
[1, 1, 1920, 1280]
model.diffusion_model.output_blocks.5.1.norm.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.norm.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.proj_in.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.proj_in.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.output_blocks.5.1.proj_out.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.proj_out.weight
F16
F16
[1, 1, 1280, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[1280, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[10240]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[1280, 10240]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[5120, 1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.2.conv.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.5.2.conv.weight
F16
F16
[3, 3, 1280, 1280]
model.diffusion_model.output_blocks.6.0.emb_layers.1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 640]
model.diffusion_model.output_blocks.6.0.in_layers.0.bias
Q4_0
Q4_0
[1920]
model.diffusion_model.output_blocks.6.0.in_layers.0.weight
Q4_0
Q4_0
[1920]
model.diffusion_model.output_blocks.6.0.in_layers.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.0.in_layers.2.weight
F16
F16
[3, 3, 1920, 640]
model.diffusion_model.output_blocks.6.0.out_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.0.out_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.0.out_layers.3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.0.out_layers.3.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.output_blocks.6.0.skip_connection.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.0.skip_connection.weight
F16
F16
[1, 1, 1920, 640]
model.diffusion_model.output_blocks.6.1.norm.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.norm.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.proj_in.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.proj_in.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.output_blocks.6.1.proj_out.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.proj_out.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[5120]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[640, 5120]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[2560, 640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.6.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.0.emb_layers.1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 640]
model.diffusion_model.output_blocks.7.0.in_layers.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.7.0.in_layers.0.weight
Q4_0
Q4_0
[1280]
model.diffusion_model.output_blocks.7.0.in_layers.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.0.in_layers.2.weight
F16
F16
[3, 3, 1280, 640]
model.diffusion_model.output_blocks.7.0.out_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.0.out_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.0.out_layers.3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.0.out_layers.3.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.output_blocks.7.0.skip_connection.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.0.skip_connection.weight
F16
F16
[1, 1, 1280, 640]
model.diffusion_model.output_blocks.7.1.norm.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.norm.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.proj_in.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.proj_in.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.output_blocks.7.1.proj_out.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.proj_out.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[5120]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[640, 5120]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[2560, 640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.7.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.0.emb_layers.1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 640]
model.diffusion_model.output_blocks.8.0.in_layers.0.bias
Q4_0
Q4_0
[960]
model.diffusion_model.output_blocks.8.0.in_layers.0.weight
Q4_0
Q4_0
[960]
model.diffusion_model.output_blocks.8.0.in_layers.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.0.in_layers.2.weight
F16
F16
[3, 3, 960, 640]
model.diffusion_model.output_blocks.8.0.out_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.0.out_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.0.out_layers.3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.0.out_layers.3.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.output_blocks.8.0.skip_connection.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.0.skip_connection.weight
F16
F16
[1, 1, 960, 640]
model.diffusion_model.output_blocks.8.1.norm.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.norm.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.proj_in.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.proj_in.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.output_blocks.8.1.proj_out.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.proj_out.weight
F16
F16
[1, 1, 640, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[640, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[5120]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[640, 5120]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[2560, 640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.2.conv.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.8.2.conv.weight
F16
F16
[3, 3, 640, 640]
model.diffusion_model.output_blocks.9.0.emb_layers.1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.output_blocks.9.0.in_layers.0.bias
Q4_0
Q4_0
[960]
model.diffusion_model.output_blocks.9.0.in_layers.0.weight
Q4_0
Q4_0
[960]
model.diffusion_model.output_blocks.9.0.in_layers.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.0.in_layers.2.weight
F16
F16
[3, 3, 960, 320]
model.diffusion_model.output_blocks.9.0.out_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.0.out_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.0.out_layers.3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.0.out_layers.3.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.output_blocks.9.0.skip_connection.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.0.skip_connection.weight
F16
F16
[1, 1, 960, 320]
model.diffusion_model.output_blocks.9.1.norm.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.norm.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.proj_in.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.proj_in.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.output_blocks.9.1.proj_out.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.proj_out.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[320, 2560]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.9.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.0.emb_layers.1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.output_blocks.10.0.in_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.10.0.in_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.10.0.in_layers.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.0.in_layers.2.weight
F16
F16
[3, 3, 640, 320]
model.diffusion_model.output_blocks.10.0.out_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.0.out_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.0.out_layers.3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.0.out_layers.3.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.output_blocks.10.0.skip_connection.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.0.skip_connection.weight
F16
F16
[1, 1, 640, 320]
model.diffusion_model.output_blocks.10.1.norm.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.norm.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.proj_in.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.proj_in.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.output_blocks.10.1.proj_out.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.proj_out.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[320, 2560]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.10.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.0.emb_layers.1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.0.emb_layers.1.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.output_blocks.11.0.in_layers.0.bias
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.11.0.in_layers.0.weight
Q4_0
Q4_0
[640]
model.diffusion_model.output_blocks.11.0.in_layers.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.0.in_layers.2.weight
F16
F16
[3, 3, 640, 320]
model.diffusion_model.output_blocks.11.0.out_layers.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.0.out_layers.0.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.0.out_layers.3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.0.out_layers.3.weight
F16
F16
[3, 3, 320, 320]
model.diffusion_model.output_blocks.11.0.skip_connection.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.0.skip_connection.weight
F16
F16
[1, 1, 640, 320]
model.diffusion_model.output_blocks.11.1.norm.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.norm.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.proj_in.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.proj_in.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.output_blocks.11.1.proj_out.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.proj_out.weight
F16
F16
[1, 1, 320, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn1.to_k.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn1.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn1.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn1.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn1.to_v.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn2.to_k.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn2.to_out.0.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn2.to_out.0.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn2.to_q.weight
Q4_0
Q4_0
[320, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.attn2.to_v.weight
Q4_0
Q4_0
[768, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.ff.net.0.proj.bias
Q4_0
Q4_0
[2560]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.ff.net.0.proj.weight
Q4_0
Q4_0
[320, 2560]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.ff.net.2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.ff.net.2.weight
Q4_0
Q4_0
[1280, 320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.norm1.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.norm1.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.norm2.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.norm2.weight
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.norm3.bias
Q4_0
Q4_0
[320]
model.diffusion_model.output_blocks.11.1.transformer_blocks.0.norm3.weight
Q4_0
Q4_0
[320]
model.diffusion_model.time_embed.0.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.time_embed.0.weight
Q4_0
Q4_0
[320, 1280]
model.diffusion_model.time_embed.2.bias
Q4_0
Q4_0
[1280]
model.diffusion_model.time_embed.2.weight
Q4_0
Q4_0
[1280, 1280]