Writer/Palmyra-Med-70B-32K in Ollama

63 2 months ago

f9fef2fa2788 · 35GB
    Metadata
  • split.count
    2
  • split.no
    1
  • split.tensors.count
    723
  • Tensor
  • Name
    Type
    Shape
  • blk.42
  • blk.42.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.42.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.42.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.42.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.42.ffn_norm.weight
    F32
    [8192]
  • blk.42.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.43
  • blk.43.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.43.attn_norm.weight
    F32
    [8192]
  • blk.43.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.43.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.43.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.43.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.43.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.43.ffn_norm.weight
    F32
    [8192]
  • blk.43.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.44
  • blk.44.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.44.attn_norm.weight
    F32
    [8192]
  • blk.44.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.44.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.44.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.44.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.44.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.44.ffn_norm.weight
    F32
    [8192]
  • blk.44.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.45
  • blk.45.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.45.attn_norm.weight
    F32
    [8192]
  • blk.45.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.45.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.45.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.45.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.45.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.45.ffn_norm.weight
    F32
    [8192]
  • blk.45.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.46
  • blk.46.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.46.attn_norm.weight
    F32
    [8192]
  • blk.46.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.46.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.46.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.46.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.46.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.46.ffn_norm.weight
    F32
    [8192]
  • blk.46.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.47
  • blk.47.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.47.attn_norm.weight
    F32
    [8192]
  • blk.47.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.47.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.47.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.47.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.47.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.47.ffn_norm.weight
    F32
    [8192]
  • blk.47.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.48
  • blk.48.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.48.attn_norm.weight
    F32
    [8192]
  • blk.48.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.48.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.48.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.48.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.48.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.48.ffn_norm.weight
    F32
    [8192]
  • blk.48.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.49
  • blk.49.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.49.attn_norm.weight
    F32
    [8192]
  • blk.49.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.49.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.49.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.49.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.49.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.49.ffn_norm.weight
    F32
    [8192]
  • blk.49.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.50
  • blk.50.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.50.attn_norm.weight
    F32
    [8192]
  • blk.50.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.50.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.50.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.50.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.50.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.50.ffn_norm.weight
    F32
    [8192]
  • blk.50.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.51
  • blk.51.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.51.attn_norm.weight
    F32
    [8192]
  • blk.51.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.51.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.51.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.51.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.51.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.51.ffn_norm.weight
    F32
    [8192]
  • blk.51.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.52
  • blk.52.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.52.attn_norm.weight
    F32
    [8192]
  • blk.52.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.52.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.52.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.52.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.52.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.52.ffn_norm.weight
    F32
    [8192]
  • blk.52.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.53
  • blk.53.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.53.attn_norm.weight
    F32
    [8192]
  • blk.53.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.53.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.53.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.53.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.53.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.53.ffn_norm.weight
    F32
    [8192]
  • blk.53.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.54
  • blk.54.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.54.attn_norm.weight
    F32
    [8192]
  • blk.54.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.54.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.54.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.54.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.54.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.54.ffn_norm.weight
    F32
    [8192]
  • blk.54.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.55
  • blk.55.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.55.attn_norm.weight
    F32
    [8192]
  • blk.55.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.55.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.55.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.55.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.55.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.55.ffn_norm.weight
    F32
    [8192]
  • blk.55.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.56
  • blk.56.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.56.attn_norm.weight
    F32
    [8192]
  • blk.56.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.56.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.56.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.56.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.56.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.56.ffn_norm.weight
    F32
    [8192]
  • blk.56.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.57
  • blk.57.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.57.attn_norm.weight
    F32
    [8192]
  • blk.57.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.57.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.57.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.57.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.57.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.57.ffn_norm.weight
    F32
    [8192]
  • blk.57.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.58
  • blk.58.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.58.attn_norm.weight
    F32
    [8192]
  • blk.58.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.58.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.58.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.58.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.58.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.58.ffn_norm.weight
    F32
    [8192]
  • blk.58.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.59
  • blk.59.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.59.attn_norm.weight
    F32
    [8192]
  • blk.59.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.59.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.59.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.59.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.59.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.59.ffn_norm.weight
    F32
    [8192]
  • blk.59.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.60
  • blk.60.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.60.attn_norm.weight
    F32
    [8192]
  • blk.60.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.60.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.60.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.60.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.60.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.60.ffn_norm.weight
    F32
    [8192]
  • blk.60.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.61
  • blk.61.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.61.attn_norm.weight
    F32
    [8192]
  • blk.61.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.61.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.61.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.61.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.61.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.61.ffn_norm.weight
    F32
    [8192]
  • blk.61.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.62
  • blk.62.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.62.attn_norm.weight
    F32
    [8192]
  • blk.62.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.62.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.62.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.62.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.62.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.62.ffn_norm.weight
    F32
    [8192]
  • blk.62.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.63
  • blk.63.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.63.attn_norm.weight
    F32
    [8192]
  • blk.63.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.63.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.63.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.63.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.63.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.63.ffn_norm.weight
    F32
    [8192]
  • blk.63.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.64
  • blk.64.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.64.attn_norm.weight
    F32
    [8192]
  • blk.64.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.64.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.64.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.64.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.64.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.64.ffn_norm.weight
    F32
    [8192]
  • blk.64.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.65
  • blk.65.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.65.attn_norm.weight
    F32
    [8192]
  • blk.65.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.65.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.65.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.65.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.65.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.65.ffn_norm.weight
    F32
    [8192]
  • blk.65.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.66
  • blk.66.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.66.attn_norm.weight
    F32
    [8192]
  • blk.66.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.66.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.66.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.66.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.66.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.66.ffn_norm.weight
    F32
    [8192]
  • blk.66.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.67
  • blk.67.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.67.attn_norm.weight
    F32
    [8192]
  • blk.67.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.67.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.67.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.67.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.67.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.67.ffn_norm.weight
    F32
    [8192]
  • blk.67.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.68
  • blk.68.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.68.attn_norm.weight
    F32
    [8192]
  • blk.68.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.68.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.68.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.68.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.68.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.68.ffn_norm.weight
    F32
    [8192]
  • blk.68.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.69
  • blk.69.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.69.attn_norm.weight
    F32
    [8192]
  • blk.69.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.69.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.69.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.69.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.69.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.69.ffn_norm.weight
    F32
    [8192]
  • blk.69.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.70
  • blk.70.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.70.attn_norm.weight
    F32
    [8192]
  • blk.70.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.70.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.70.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.70.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.70.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.70.ffn_norm.weight
    F32
    [8192]
  • blk.70.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.71
  • blk.71.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.71.attn_norm.weight
    F32
    [8192]
  • blk.71.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.71.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.71.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.71.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.71.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.71.ffn_norm.weight
    F32
    [8192]
  • blk.71.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.72
  • blk.72.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.72.attn_norm.weight
    F32
    [8192]
  • blk.72.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.72.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.72.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.72.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.72.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.72.ffn_norm.weight
    F32
    [8192]
  • blk.72.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.73
  • blk.73.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.73.attn_norm.weight
    F32
    [8192]
  • blk.73.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.73.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.73.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.73.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.73.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.73.ffn_norm.weight
    F32
    [8192]
  • blk.73.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.74
  • blk.74.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.74.attn_norm.weight
    F32
    [8192]
  • blk.74.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.74.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.74.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.74.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.74.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.74.ffn_norm.weight
    F32
    [8192]
  • blk.74.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.75
  • blk.75.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.75.attn_norm.weight
    F32
    [8192]
  • blk.75.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.75.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.75.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.75.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.75.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.75.ffn_norm.weight
    F32
    [8192]
  • blk.75.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.76
  • blk.76.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.76.attn_norm.weight
    F32
    [8192]
  • blk.76.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.76.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.76.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.76.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.76.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.76.ffn_norm.weight
    F32
    [8192]
  • blk.76.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.77
  • blk.77.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.77.attn_norm.weight
    F32
    [8192]
  • blk.77.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.77.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.77.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.77.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.77.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.77.ffn_norm.weight
    F32
    [8192]
  • blk.77.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.78
  • blk.78.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.78.attn_norm.weight
    F32
    [8192]
  • blk.78.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.78.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.78.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.78.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.78.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.78.ffn_norm.weight
    F32
    [8192]
  • blk.78.ffn_up.weight
    Q8_0
    [8192, 28672]
  • blk.79
  • blk.79.attn_k.weight
    Q8_0
    [8192, 1024]
  • blk.79.attn_norm.weight
    F32
    [8192]
  • blk.79.attn_output.weight
    Q8_0
    [8192, 8192]
  • blk.79.attn_q.weight
    Q8_0
    [8192, 8192]
  • blk.79.attn_v.weight
    Q8_0
    [8192, 1024]
  • blk.79.ffn_down.weight
    Q8_0
    [28672, 8192]
  • blk.79.ffn_gate.weight
    Q8_0
    [8192, 28672]
  • blk.79.ffn_norm.weight
    F32
    [8192]
  • blk.79.ffn_up.weight
    Q8_0
    [8192, 28672]
  • output.weight
    Q8_0
    [8192, 128256]
  • output_norm.weight
    F32
    [8192]