Writer/Palmyra-Med-70B-32K in Ollama
63 Pulls Updated 2 months ago
f9fef2fa2788 · 35GB
-
split.count2
-
split.no1
-
split.tensors.count723
-
NameTypeShape
-
blk.42.attn_k.weightQ8_0[8192, 1024]
-
blk.42.attn_output.weightQ8_0[8192, 8192]
-
blk.42.attn_q.weightQ8_0[8192, 8192]
-
blk.42.attn_v.weightQ8_0[8192, 1024]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weightQ8_0[8192, 28672]
-
blk.43.attn_k.weightQ8_0[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weightQ8_0[8192, 8192]
-
blk.43.attn_q.weightQ8_0[8192, 8192]
-
blk.43.attn_v.weightQ8_0[8192, 1024]
-
blk.43.ffn_down.weightQ8_0[28672, 8192]
-
blk.43.ffn_gate.weightQ8_0[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weightQ8_0[8192, 28672]
-
blk.44.attn_k.weightQ8_0[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weightQ8_0[8192, 8192]
-
blk.44.attn_q.weightQ8_0[8192, 8192]
-
blk.44.attn_v.weightQ8_0[8192, 1024]
-
blk.44.ffn_down.weightQ8_0[28672, 8192]
-
blk.44.ffn_gate.weightQ8_0[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weightQ8_0[8192, 28672]
-
blk.45.attn_k.weightQ8_0[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weightQ8_0[8192, 8192]
-
blk.45.attn_q.weightQ8_0[8192, 8192]
-
blk.45.attn_v.weightQ8_0[8192, 1024]
-
blk.45.ffn_down.weightQ8_0[28672, 8192]
-
blk.45.ffn_gate.weightQ8_0[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weightQ8_0[8192, 28672]
-
blk.46.attn_k.weightQ8_0[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weightQ8_0[8192, 8192]
-
blk.46.attn_q.weightQ8_0[8192, 8192]
-
blk.46.attn_v.weightQ8_0[8192, 1024]
-
blk.46.ffn_down.weightQ8_0[28672, 8192]
-
blk.46.ffn_gate.weightQ8_0[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weightQ8_0[8192, 28672]
-
blk.47.attn_k.weightQ8_0[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weightQ8_0[8192, 8192]
-
blk.47.attn_q.weightQ8_0[8192, 8192]
-
blk.47.attn_v.weightQ8_0[8192, 1024]
-
blk.47.ffn_down.weightQ8_0[28672, 8192]
-
blk.47.ffn_gate.weightQ8_0[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weightQ8_0[8192, 28672]
-
blk.48.attn_k.weightQ8_0[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weightQ8_0[8192, 8192]
-
blk.48.attn_q.weightQ8_0[8192, 8192]
-
blk.48.attn_v.weightQ8_0[8192, 1024]
-
blk.48.ffn_down.weightQ8_0[28672, 8192]
-
blk.48.ffn_gate.weightQ8_0[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weightQ8_0[8192, 28672]
-
blk.49.attn_k.weightQ8_0[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weightQ8_0[8192, 8192]
-
blk.49.attn_q.weightQ8_0[8192, 8192]
-
blk.49.attn_v.weightQ8_0[8192, 1024]
-
blk.49.ffn_down.weightQ8_0[28672, 8192]
-
blk.49.ffn_gate.weightQ8_0[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weightQ8_0[8192, 28672]
-
blk.50.attn_k.weightQ8_0[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weightQ8_0[8192, 8192]
-
blk.50.attn_q.weightQ8_0[8192, 8192]
-
blk.50.attn_v.weightQ8_0[8192, 1024]
-
blk.50.ffn_down.weightQ8_0[28672, 8192]
-
blk.50.ffn_gate.weightQ8_0[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weightQ8_0[8192, 28672]
-
blk.51.attn_k.weightQ8_0[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weightQ8_0[8192, 8192]
-
blk.51.attn_q.weightQ8_0[8192, 8192]
-
blk.51.attn_v.weightQ8_0[8192, 1024]
-
blk.51.ffn_down.weightQ8_0[28672, 8192]
-
blk.51.ffn_gate.weightQ8_0[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weightQ8_0[8192, 28672]
-
blk.52.attn_k.weightQ8_0[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weightQ8_0[8192, 8192]
-
blk.52.attn_q.weightQ8_0[8192, 8192]
-
blk.52.attn_v.weightQ8_0[8192, 1024]
-
blk.52.ffn_down.weightQ8_0[28672, 8192]
-
blk.52.ffn_gate.weightQ8_0[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weightQ8_0[8192, 28672]
-
blk.53.attn_k.weightQ8_0[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weightQ8_0[8192, 8192]
-
blk.53.attn_q.weightQ8_0[8192, 8192]
-
blk.53.attn_v.weightQ8_0[8192, 1024]
-
blk.53.ffn_down.weightQ8_0[28672, 8192]
-
blk.53.ffn_gate.weightQ8_0[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weightQ8_0[8192, 28672]
-
blk.54.attn_k.weightQ8_0[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weightQ8_0[8192, 8192]
-
blk.54.attn_q.weightQ8_0[8192, 8192]
-
blk.54.attn_v.weightQ8_0[8192, 1024]
-
blk.54.ffn_down.weightQ8_0[28672, 8192]
-
blk.54.ffn_gate.weightQ8_0[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weightQ8_0[8192, 28672]
-
blk.55.attn_k.weightQ8_0[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weightQ8_0[8192, 8192]
-
blk.55.attn_q.weightQ8_0[8192, 8192]
-
blk.55.attn_v.weightQ8_0[8192, 1024]
-
blk.55.ffn_down.weightQ8_0[28672, 8192]
-
blk.55.ffn_gate.weightQ8_0[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weightQ8_0[8192, 28672]
-
blk.56.attn_k.weightQ8_0[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weightQ8_0[8192, 8192]
-
blk.56.attn_q.weightQ8_0[8192, 8192]
-
blk.56.attn_v.weightQ8_0[8192, 1024]
-
blk.56.ffn_down.weightQ8_0[28672, 8192]
-
blk.56.ffn_gate.weightQ8_0[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weightQ8_0[8192, 28672]
-
blk.57.attn_k.weightQ8_0[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weightQ8_0[8192, 8192]
-
blk.57.attn_q.weightQ8_0[8192, 8192]
-
blk.57.attn_v.weightQ8_0[8192, 1024]
-
blk.57.ffn_down.weightQ8_0[28672, 8192]
-
blk.57.ffn_gate.weightQ8_0[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weightQ8_0[8192, 28672]
-
blk.58.attn_k.weightQ8_0[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weightQ8_0[8192, 8192]
-
blk.58.attn_q.weightQ8_0[8192, 8192]
-
blk.58.attn_v.weightQ8_0[8192, 1024]
-
blk.58.ffn_down.weightQ8_0[28672, 8192]
-
blk.58.ffn_gate.weightQ8_0[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weightQ8_0[8192, 28672]
-
blk.59.attn_k.weightQ8_0[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weightQ8_0[8192, 8192]
-
blk.59.attn_q.weightQ8_0[8192, 8192]
-
blk.59.attn_v.weightQ8_0[8192, 1024]
-
blk.59.ffn_down.weightQ8_0[28672, 8192]
-
blk.59.ffn_gate.weightQ8_0[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weightQ8_0[8192, 28672]
-
blk.60.attn_k.weightQ8_0[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weightQ8_0[8192, 8192]
-
blk.60.attn_q.weightQ8_0[8192, 8192]
-
blk.60.attn_v.weightQ8_0[8192, 1024]
-
blk.60.ffn_down.weightQ8_0[28672, 8192]
-
blk.60.ffn_gate.weightQ8_0[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weightQ8_0[8192, 28672]
-
blk.61.attn_k.weightQ8_0[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weightQ8_0[8192, 8192]
-
blk.61.attn_q.weightQ8_0[8192, 8192]
-
blk.61.attn_v.weightQ8_0[8192, 1024]
-
blk.61.ffn_down.weightQ8_0[28672, 8192]
-
blk.61.ffn_gate.weightQ8_0[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weightQ8_0[8192, 28672]
-
blk.62.attn_k.weightQ8_0[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weightQ8_0[8192, 8192]
-
blk.62.attn_q.weightQ8_0[8192, 8192]
-
blk.62.attn_v.weightQ8_0[8192, 1024]
-
blk.62.ffn_down.weightQ8_0[28672, 8192]
-
blk.62.ffn_gate.weightQ8_0[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weightQ8_0[8192, 28672]
-
blk.63.attn_k.weightQ8_0[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weightQ8_0[8192, 8192]
-
blk.63.attn_q.weightQ8_0[8192, 8192]
-
blk.63.attn_v.weightQ8_0[8192, 1024]
-
blk.63.ffn_down.weightQ8_0[28672, 8192]
-
blk.63.ffn_gate.weightQ8_0[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weightQ8_0[8192, 28672]
-
blk.64.attn_k.weightQ8_0[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weightQ8_0[8192, 8192]
-
blk.64.attn_q.weightQ8_0[8192, 8192]
-
blk.64.attn_v.weightQ8_0[8192, 1024]
-
blk.64.ffn_down.weightQ8_0[28672, 8192]
-
blk.64.ffn_gate.weightQ8_0[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weightQ8_0[8192, 28672]
-
blk.65.attn_k.weightQ8_0[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weightQ8_0[8192, 8192]
-
blk.65.attn_q.weightQ8_0[8192, 8192]
-
blk.65.attn_v.weightQ8_0[8192, 1024]
-
blk.65.ffn_down.weightQ8_0[28672, 8192]
-
blk.65.ffn_gate.weightQ8_0[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weightQ8_0[8192, 28672]
-
blk.66.attn_k.weightQ8_0[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weightQ8_0[8192, 8192]
-
blk.66.attn_q.weightQ8_0[8192, 8192]
-
blk.66.attn_v.weightQ8_0[8192, 1024]
-
blk.66.ffn_down.weightQ8_0[28672, 8192]
-
blk.66.ffn_gate.weightQ8_0[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weightQ8_0[8192, 28672]
-
blk.67.attn_k.weightQ8_0[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weightQ8_0[8192, 8192]
-
blk.67.attn_q.weightQ8_0[8192, 8192]
-
blk.67.attn_v.weightQ8_0[8192, 1024]
-
blk.67.ffn_down.weightQ8_0[28672, 8192]
-
blk.67.ffn_gate.weightQ8_0[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weightQ8_0[8192, 28672]
-
blk.68.attn_k.weightQ8_0[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weightQ8_0[8192, 8192]
-
blk.68.attn_q.weightQ8_0[8192, 8192]
-
blk.68.attn_v.weightQ8_0[8192, 1024]
-
blk.68.ffn_down.weightQ8_0[28672, 8192]
-
blk.68.ffn_gate.weightQ8_0[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weightQ8_0[8192, 28672]
-
blk.69.attn_k.weightQ8_0[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weightQ8_0[8192, 8192]
-
blk.69.attn_q.weightQ8_0[8192, 8192]
-
blk.69.attn_v.weightQ8_0[8192, 1024]
-
blk.69.ffn_down.weightQ8_0[28672, 8192]
-
blk.69.ffn_gate.weightQ8_0[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weightQ8_0[8192, 28672]
-
blk.70.attn_k.weightQ8_0[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weightQ8_0[8192, 8192]
-
blk.70.attn_q.weightQ8_0[8192, 8192]
-
blk.70.attn_v.weightQ8_0[8192, 1024]
-
blk.70.ffn_down.weightQ8_0[28672, 8192]
-
blk.70.ffn_gate.weightQ8_0[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weightQ8_0[8192, 28672]
-
blk.71.attn_k.weightQ8_0[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weightQ8_0[8192, 8192]
-
blk.71.attn_q.weightQ8_0[8192, 8192]
-
blk.71.attn_v.weightQ8_0[8192, 1024]
-
blk.71.ffn_down.weightQ8_0[28672, 8192]
-
blk.71.ffn_gate.weightQ8_0[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weightQ8_0[8192, 28672]
-
blk.72.attn_k.weightQ8_0[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weightQ8_0[8192, 8192]
-
blk.72.attn_q.weightQ8_0[8192, 8192]
-
blk.72.attn_v.weightQ8_0[8192, 1024]
-
blk.72.ffn_down.weightQ8_0[28672, 8192]
-
blk.72.ffn_gate.weightQ8_0[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weightQ8_0[8192, 28672]
-
blk.73.attn_k.weightQ8_0[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weightQ8_0[8192, 8192]
-
blk.73.attn_q.weightQ8_0[8192, 8192]
-
blk.73.attn_v.weightQ8_0[8192, 1024]
-
blk.73.ffn_down.weightQ8_0[28672, 8192]
-
blk.73.ffn_gate.weightQ8_0[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weightQ8_0[8192, 28672]
-
blk.74.attn_k.weightQ8_0[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weightQ8_0[8192, 8192]
-
blk.74.attn_q.weightQ8_0[8192, 8192]
-
blk.74.attn_v.weightQ8_0[8192, 1024]
-
blk.74.ffn_down.weightQ8_0[28672, 8192]
-
blk.74.ffn_gate.weightQ8_0[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weightQ8_0[8192, 28672]
-
blk.75.attn_k.weightQ8_0[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weightQ8_0[8192, 8192]
-
blk.75.attn_q.weightQ8_0[8192, 8192]
-
blk.75.attn_v.weightQ8_0[8192, 1024]
-
blk.75.ffn_down.weightQ8_0[28672, 8192]
-
blk.75.ffn_gate.weightQ8_0[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weightQ8_0[8192, 28672]
-
blk.76.attn_k.weightQ8_0[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weightQ8_0[8192, 8192]
-
blk.76.attn_q.weightQ8_0[8192, 8192]
-
blk.76.attn_v.weightQ8_0[8192, 1024]
-
blk.76.ffn_down.weightQ8_0[28672, 8192]
-
blk.76.ffn_gate.weightQ8_0[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weightQ8_0[8192, 28672]
-
blk.77.attn_k.weightQ8_0[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weightQ8_0[8192, 8192]
-
blk.77.attn_q.weightQ8_0[8192, 8192]
-
blk.77.attn_v.weightQ8_0[8192, 1024]
-
blk.77.ffn_down.weightQ8_0[28672, 8192]
-
blk.77.ffn_gate.weightQ8_0[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weightQ8_0[8192, 28672]
-
blk.78.attn_k.weightQ8_0[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weightQ8_0[8192, 8192]
-
blk.78.attn_q.weightQ8_0[8192, 8192]
-
blk.78.attn_v.weightQ8_0[8192, 1024]
-
blk.78.ffn_down.weightQ8_0[28672, 8192]
-
blk.78.ffn_gate.weightQ8_0[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weightQ8_0[8192, 28672]
-
blk.79.attn_k.weightQ8_0[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weightQ8_0[8192, 8192]
-
blk.79.attn_q.weightQ8_0[8192, 8192]
-
blk.79.attn_v.weightQ8_0[8192, 1024]
-
blk.79.ffn_down.weightQ8_0[28672, 8192]
-
blk.79.ffn_gate.weightQ8_0[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weightQ8_0[8192, 28672]
-
output.weightQ8_0[8192, 128256]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79