Writer/Palmyra-Med-70B-32K in Ollama
66 Pulls Updated 2 months ago
0731926d5c50 · 18GB
-
split.count2
-
split.no1
-
split.tensors.count723
-
NameTypeShape
-
blk.55.attn_k.weightQ6_K[8192, 1024]
-
blk.55.attn_output.weightQ6_K[8192, 8192]
-
blk.55.attn_q.weightQ6_K[8192, 8192]
-
blk.55.attn_v.weightQ6_K[8192, 1024]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weightQ6_K[8192, 28672]
-
blk.56.attn_k.weightQ6_K[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weightQ6_K[8192, 8192]
-
blk.56.attn_q.weightQ6_K[8192, 8192]
-
blk.56.attn_v.weightQ6_K[8192, 1024]
-
blk.56.ffn_down.weightQ6_K[28672, 8192]
-
blk.56.ffn_gate.weightQ6_K[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weightQ6_K[8192, 28672]
-
blk.57.attn_k.weightQ6_K[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weightQ6_K[8192, 8192]
-
blk.57.attn_q.weightQ6_K[8192, 8192]
-
blk.57.attn_v.weightQ6_K[8192, 1024]
-
blk.57.ffn_down.weightQ6_K[28672, 8192]
-
blk.57.ffn_gate.weightQ6_K[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weightQ6_K[8192, 28672]
-
blk.58.attn_k.weightQ6_K[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weightQ6_K[8192, 8192]
-
blk.58.attn_q.weightQ6_K[8192, 8192]
-
blk.58.attn_v.weightQ6_K[8192, 1024]
-
blk.58.ffn_down.weightQ6_K[28672, 8192]
-
blk.58.ffn_gate.weightQ6_K[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weightQ6_K[8192, 28672]
-
blk.59.attn_k.weightQ6_K[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weightQ6_K[8192, 8192]
-
blk.59.attn_q.weightQ6_K[8192, 8192]
-
blk.59.attn_v.weightQ6_K[8192, 1024]
-
blk.59.ffn_down.weightQ6_K[28672, 8192]
-
blk.59.ffn_gate.weightQ6_K[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weightQ6_K[8192, 28672]
-
blk.60.attn_k.weightQ6_K[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weightQ6_K[8192, 8192]
-
blk.60.attn_q.weightQ6_K[8192, 8192]
-
blk.60.attn_v.weightQ6_K[8192, 1024]
-
blk.60.ffn_down.weightQ6_K[28672, 8192]
-
blk.60.ffn_gate.weightQ6_K[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weightQ6_K[8192, 28672]
-
blk.61.attn_k.weightQ6_K[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weightQ6_K[8192, 8192]
-
blk.61.attn_q.weightQ6_K[8192, 8192]
-
blk.61.attn_v.weightQ6_K[8192, 1024]
-
blk.61.ffn_down.weightQ6_K[28672, 8192]
-
blk.61.ffn_gate.weightQ6_K[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weightQ6_K[8192, 28672]
-
blk.62.attn_k.weightQ6_K[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weightQ6_K[8192, 8192]
-
blk.62.attn_q.weightQ6_K[8192, 8192]
-
blk.62.attn_v.weightQ6_K[8192, 1024]
-
blk.62.ffn_down.weightQ6_K[28672, 8192]
-
blk.62.ffn_gate.weightQ6_K[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weightQ6_K[8192, 28672]
-
blk.63.attn_k.weightQ6_K[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weightQ6_K[8192, 8192]
-
blk.63.attn_q.weightQ6_K[8192, 8192]
-
blk.63.attn_v.weightQ6_K[8192, 1024]
-
blk.63.ffn_down.weightQ6_K[28672, 8192]
-
blk.63.ffn_gate.weightQ6_K[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weightQ6_K[8192, 28672]
-
blk.64.attn_k.weightQ6_K[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weightQ6_K[8192, 8192]
-
blk.64.attn_q.weightQ6_K[8192, 8192]
-
blk.64.attn_v.weightQ6_K[8192, 1024]
-
blk.64.ffn_down.weightQ6_K[28672, 8192]
-
blk.64.ffn_gate.weightQ6_K[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weightQ6_K[8192, 28672]
-
blk.65.attn_k.weightQ6_K[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weightQ6_K[8192, 8192]
-
blk.65.attn_q.weightQ6_K[8192, 8192]
-
blk.65.attn_v.weightQ6_K[8192, 1024]
-
blk.65.ffn_down.weightQ6_K[28672, 8192]
-
blk.65.ffn_gate.weightQ6_K[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weightQ6_K[8192, 28672]
-
blk.66.attn_k.weightQ6_K[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weightQ6_K[8192, 8192]
-
blk.66.attn_q.weightQ6_K[8192, 8192]
-
blk.66.attn_v.weightQ6_K[8192, 1024]
-
blk.66.ffn_down.weightQ6_K[28672, 8192]
-
blk.66.ffn_gate.weightQ6_K[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weightQ6_K[8192, 28672]
-
blk.67.attn_k.weightQ6_K[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weightQ6_K[8192, 8192]
-
blk.67.attn_q.weightQ6_K[8192, 8192]
-
blk.67.attn_v.weightQ6_K[8192, 1024]
-
blk.67.ffn_down.weightQ6_K[28672, 8192]
-
blk.67.ffn_gate.weightQ6_K[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weightQ6_K[8192, 28672]
-
blk.68.attn_k.weightQ6_K[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weightQ6_K[8192, 8192]
-
blk.68.attn_q.weightQ6_K[8192, 8192]
-
blk.68.attn_v.weightQ6_K[8192, 1024]
-
blk.68.ffn_down.weightQ6_K[28672, 8192]
-
blk.68.ffn_gate.weightQ6_K[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weightQ6_K[8192, 28672]
-
blk.69.attn_k.weightQ6_K[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weightQ6_K[8192, 8192]
-
blk.69.attn_q.weightQ6_K[8192, 8192]
-
blk.69.attn_v.weightQ6_K[8192, 1024]
-
blk.69.ffn_down.weightQ6_K[28672, 8192]
-
blk.69.ffn_gate.weightQ6_K[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weightQ6_K[8192, 28672]
-
blk.70.attn_k.weightQ6_K[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weightQ6_K[8192, 8192]
-
blk.70.attn_q.weightQ6_K[8192, 8192]
-
blk.70.attn_v.weightQ6_K[8192, 1024]
-
blk.70.ffn_down.weightQ6_K[28672, 8192]
-
blk.70.ffn_gate.weightQ6_K[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weightQ6_K[8192, 28672]
-
blk.71.attn_k.weightQ6_K[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weightQ6_K[8192, 8192]
-
blk.71.attn_q.weightQ6_K[8192, 8192]
-
blk.71.attn_v.weightQ6_K[8192, 1024]
-
blk.71.ffn_down.weightQ6_K[28672, 8192]
-
blk.71.ffn_gate.weightQ6_K[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weightQ6_K[8192, 28672]
-
blk.72.attn_k.weightQ6_K[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weightQ6_K[8192, 8192]
-
blk.72.attn_q.weightQ6_K[8192, 8192]
-
blk.72.attn_v.weightQ6_K[8192, 1024]
-
blk.72.ffn_down.weightQ6_K[28672, 8192]
-
blk.72.ffn_gate.weightQ6_K[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weightQ6_K[8192, 28672]
-
blk.73.attn_k.weightQ6_K[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weightQ6_K[8192, 8192]
-
blk.73.attn_q.weightQ6_K[8192, 8192]
-
blk.73.attn_v.weightQ6_K[8192, 1024]
-
blk.73.ffn_down.weightQ6_K[28672, 8192]
-
blk.73.ffn_gate.weightQ6_K[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weightQ6_K[8192, 28672]
-
blk.74.attn_k.weightQ6_K[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weightQ6_K[8192, 8192]
-
blk.74.attn_q.weightQ6_K[8192, 8192]
-
blk.74.attn_v.weightQ6_K[8192, 1024]
-
blk.74.ffn_down.weightQ6_K[28672, 8192]
-
blk.74.ffn_gate.weightQ6_K[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weightQ6_K[8192, 28672]
-
blk.75.attn_k.weightQ6_K[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weightQ6_K[8192, 8192]
-
blk.75.attn_q.weightQ6_K[8192, 8192]
-
blk.75.attn_v.weightQ6_K[8192, 1024]
-
blk.75.ffn_down.weightQ6_K[28672, 8192]
-
blk.75.ffn_gate.weightQ6_K[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weightQ6_K[8192, 28672]
-
blk.76.attn_k.weightQ6_K[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weightQ6_K[8192, 8192]
-
blk.76.attn_q.weightQ6_K[8192, 8192]
-
blk.76.attn_v.weightQ6_K[8192, 1024]
-
blk.76.ffn_down.weightQ6_K[28672, 8192]
-
blk.76.ffn_gate.weightQ6_K[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weightQ6_K[8192, 28672]
-
blk.77.attn_k.weightQ6_K[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weightQ6_K[8192, 8192]
-
blk.77.attn_q.weightQ6_K[8192, 8192]
-
blk.77.attn_v.weightQ6_K[8192, 1024]
-
blk.77.ffn_down.weightQ6_K[28672, 8192]
-
blk.77.ffn_gate.weightQ6_K[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weightQ6_K[8192, 28672]
-
blk.78.attn_k.weightQ6_K[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weightQ6_K[8192, 8192]
-
blk.78.attn_q.weightQ6_K[8192, 8192]
-
blk.78.attn_v.weightQ6_K[8192, 1024]
-
blk.78.ffn_down.weightQ6_K[28672, 8192]
-
blk.78.ffn_gate.weightQ6_K[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weightQ6_K[8192, 28672]
-
blk.79.attn_k.weightQ6_K[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weightQ6_K[8192, 8192]
-
blk.79.attn_q.weightQ6_K[8192, 8192]
-
blk.79.attn_v.weightQ6_K[8192, 1024]
-
blk.79.ffn_down.weightQ6_K[28672, 8192]
-
blk.79.ffn_gate.weightQ6_K[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weightQ6_K[8192, 28672]
-
output.weightQ6_K[8192, 128256]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79