MaziyarPanahi/firefunction-v2-GGUF
61 Pulls Updated 4 months ago
435f8864e2de · 17GB
-
general.architecturellama
-
general.file_type31
-
general.namemodels--fireworks-ai--firefunction-v2
-
general.quantization_version2
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length8192
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
quantize.imatrix.chunks_count69
-
quantize.imatrix.datasetgroup_40.txt
-
quantize.imatrix.entries_count560
-
quantize.imatrix.file./imatrix.dat
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id128255
-
tokenizer.ggml.presmaug-bpe
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
tokenizer.ggml.unknown_token_id128255
-
NameTypeShape
-
token_embd.weightQ2_K[8192, 128256]
-
blk.0.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.attn_output.weightI8[8192, 8192]
-
blk.0.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.0.attn_v.weightQ4_K[8192, 1024]
-
blk.0.ffn_down.weightQ2_K[28672, 8192]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.1.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.attn_output.weightI8[8192, 8192]
-
blk.1.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.1.attn_v.weightQ4_K[8192, 1024]
-
blk.1.ffn_down.weightQ2_K[28672, 8192]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.2.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.attn_output.weightI8[8192, 8192]
-
blk.2.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.2.attn_v.weightQ4_K[8192, 1024]
-
blk.2.ffn_down.weightQ2_K[28672, 8192]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.3.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.attn_output.weightI8[8192, 8192]
-
blk.3.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.3.attn_v.weightQ4_K[8192, 1024]
-
blk.3.ffn_down.weightQ2_K[28672, 8192]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.4.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.attn_output.weightI8[8192, 8192]
-
blk.4.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.4.attn_v.weightQ4_K[8192, 1024]
-
blk.4.ffn_down.weightQ2_K[28672, 8192]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.5.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.attn_output.weightI8[8192, 8192]
-
blk.5.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.5.attn_v.weightQ4_K[8192, 1024]
-
blk.5.ffn_down.weightQ2_K[28672, 8192]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.6.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.attn_output.weightI8[8192, 8192]
-
blk.6.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.6.attn_v.weightQ4_K[8192, 1024]
-
blk.6.ffn_down.weightQ2_K[28672, 8192]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.7.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.attn_output.weightI8[8192, 8192]
-
blk.7.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.7.attn_v.weightQ4_K[8192, 1024]
-
blk.7.ffn_down.weightQ2_K[28672, 8192]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.8.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.attn_output.weightI8[8192, 8192]
-
blk.8.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.8.attn_v.weightQ4_K[8192, 1024]
-
blk.8.ffn_down.weightQ2_K[28672, 8192]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.9.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.attn_output.weightI8[8192, 8192]
-
blk.9.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.9.attn_v.weightQ4_K[8192, 1024]
-
blk.9.ffn_down.weightQ2_K[28672, 8192]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.10.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.attn_output.weightI8[8192, 8192]
-
blk.10.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.10.attn_v.weightQ4_K[8192, 1024]
-
blk.10.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.11.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.attn_output.weightI8[8192, 8192]
-
blk.11.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.11.attn_v.weightQ4_K[8192, 1024]
-
blk.11.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.12.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.attn_output.weightI8[8192, 8192]
-
blk.12.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.12.attn_v.weightQ4_K[8192, 1024]
-
blk.12.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.13.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.attn_output.weightI8[8192, 8192]
-
blk.13.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.13.attn_v.weightQ4_K[8192, 1024]
-
blk.13.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.14.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.attn_output.weightI8[8192, 8192]
-
blk.14.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.14.attn_v.weightQ4_K[8192, 1024]
-
blk.14.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.15.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.attn_output.weightI8[8192, 8192]
-
blk.15.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.15.attn_v.weightQ4_K[8192, 1024]
-
blk.15.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.16.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.attn_output.weightI8[8192, 8192]
-
blk.16.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.16.attn_v.weightQ4_K[8192, 1024]
-
blk.16.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.17.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.attn_output.weightI8[8192, 8192]
-
blk.17.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.17.attn_v.weightQ4_K[8192, 1024]
-
blk.17.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.18.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.attn_output.weightI8[8192, 8192]
-
blk.18.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.18.attn_v.weightQ4_K[8192, 1024]
-
blk.18.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.19.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.attn_output.weightI8[8192, 8192]
-
blk.19.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.19.attn_v.weightQ4_K[8192, 1024]
-
blk.19.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.20.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.attn_output.weightI8[8192, 8192]
-
blk.20.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.20.attn_v.weightQ4_K[8192, 1024]
-
blk.20.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.21.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.attn_output.weightI8[8192, 8192]
-
blk.21.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.21.attn_v.weightQ4_K[8192, 1024]
-
blk.21.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.22.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.attn_output.weightI8[8192, 8192]
-
blk.22.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.22.attn_v.weightQ4_K[8192, 1024]
-
blk.22.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.23.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.attn_output.weightI8[8192, 8192]
-
blk.23.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.23.attn_v.weightQ4_K[8192, 1024]
-
blk.23.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.24.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.attn_output.weightI8[8192, 8192]
-
blk.24.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.24.attn_v.weightQ4_K[8192, 1024]
-
blk.24.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.25.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.attn_output.weightI8[8192, 8192]
-
blk.25.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.25.attn_v.weightQ4_K[8192, 1024]
-
blk.25.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.26.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.attn_output.weightI8[8192, 8192]
-
blk.26.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.26.attn_v.weightQ4_K[8192, 1024]
-
blk.26.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.27.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.attn_output.weightI8[8192, 8192]
-
blk.27.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.27.attn_v.weightQ4_K[8192, 1024]
-
blk.27.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.28.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.attn_output.weightI8[8192, 8192]
-
blk.28.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.28.attn_v.weightQ4_K[8192, 1024]
-
blk.28.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.29.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.attn_output.weightI8[8192, 8192]
-
blk.29.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.29.attn_v.weightQ4_K[8192, 1024]
-
blk.29.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.30.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.attn_output.weightI8[8192, 8192]
-
blk.30.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.30.attn_v.weightQ4_K[8192, 1024]
-
blk.30.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.31.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.attn_output.weightI8[8192, 8192]
-
blk.31.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.31.attn_v.weightQ4_K[8192, 1024]
-
blk.31.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.32.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.attn_output.weightI8[8192, 8192]
-
blk.32.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.32.attn_v.weightQ4_K[8192, 1024]
-
blk.32.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.33.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.attn_output.weightI8[8192, 8192]
-
blk.33.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.33.attn_v.weightQ4_K[8192, 1024]
-
blk.33.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.34.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.attn_output.weightI8[8192, 8192]
-
blk.34.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.34.attn_v.weightQ4_K[8192, 1024]
-
blk.34.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.35.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.attn_output.weightI8[8192, 8192]
-
blk.35.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.35.attn_v.weightQ4_K[8192, 1024]
-
blk.35.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.36.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.attn_output.weightI8[8192, 8192]
-
blk.36.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.36.attn_v.weightQ4_K[8192, 1024]
-
blk.36.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.37.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.attn_output.weightI8[8192, 8192]
-
blk.37.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.37.attn_v.weightQ4_K[8192, 1024]
-
blk.37.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.38.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.attn_output.weightI8[8192, 8192]
-
blk.38.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.38.attn_v.weightQ4_K[8192, 1024]
-
blk.38.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.39.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.attn_output.weightI8[8192, 8192]
-
blk.39.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.39.attn_v.weightQ4_K[8192, 1024]
-
blk.39.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.40.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.attn_output.weightI8[8192, 8192]
-
blk.40.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.40.attn_v.weightQ4_K[8192, 1024]
-
blk.40.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.41.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.attn_output.weightI8[8192, 8192]
-
blk.41.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.41.attn_v.weightQ4_K[8192, 1024]
-
blk.41.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.42.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.attn_output.weightI8[8192, 8192]
-
blk.42.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.42.attn_v.weightQ4_K[8192, 1024]
-
blk.42.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.43.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.attn_output.weightI8[8192, 8192]
-
blk.43.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.43.attn_v.weightQ4_K[8192, 1024]
-
blk.43.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.44.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.attn_output.weightI8[8192, 8192]
-
blk.44.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.44.attn_v.weightQ4_K[8192, 1024]
-
blk.44.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.45.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.attn_output.weightI8[8192, 8192]
-
blk.45.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.45.attn_v.weightQ4_K[8192, 1024]
-
blk.45.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.46.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_output.weightI8[8192, 8192]
-
blk.46.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.46.attn_v.weightQ4_K[8192, 1024]
-
blk.46.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.47.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.attn_output.weightI8[8192, 8192]
-
blk.47.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.47.attn_v.weightQ4_K[8192, 1024]
-
blk.47.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.48.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.attn_output.weightI8[8192, 8192]
-
blk.48.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.48.attn_v.weightQ4_K[8192, 1024]
-
blk.48.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.49.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.attn_output.weightI8[8192, 8192]
-
blk.49.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.49.attn_v.weightQ4_K[8192, 1024]
-
blk.49.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.50.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.attn_output.weightI8[8192, 8192]
-
blk.50.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.50.attn_v.weightQ4_K[8192, 1024]
-
blk.50.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.50.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.51.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.attn_output.weightI8[8192, 8192]
-
blk.51.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.51.attn_v.weightQ4_K[8192, 1024]
-
blk.51.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.51.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.52.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.attn_output.weightI8[8192, 8192]
-
blk.52.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.52.attn_v.weightQ4_K[8192, 1024]
-
blk.52.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.52.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.53.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.attn_output.weightI8[8192, 8192]
-
blk.53.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.53.attn_v.weightQ4_K[8192, 1024]
-
blk.53.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.53.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.54.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.attn_output.weightI8[8192, 8192]
-
blk.54.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.54.attn_v.weightQ4_K[8192, 1024]
-
blk.54.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.54.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.55.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.attn_output.weightI8[8192, 8192]
-
blk.55.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.55.attn_v.weightQ4_K[8192, 1024]
-
blk.55.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.55.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.56.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.attn_output.weightI8[8192, 8192]
-
blk.56.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.56.attn_v.weightQ4_K[8192, 1024]
-
blk.56.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.56.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.57.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.attn_output.weightI8[8192, 8192]
-
blk.57.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.57.attn_v.weightQ4_K[8192, 1024]
-
blk.57.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.57.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.58.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.attn_output.weightI8[8192, 8192]
-
blk.58.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.58.attn_v.weightQ4_K[8192, 1024]
-
blk.58.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.58.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.59.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.attn_output.weightI8[8192, 8192]
-
blk.59.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.59.attn_v.weightQ4_K[8192, 1024]
-
blk.59.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.59.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.60.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.attn_output.weightI8[8192, 8192]
-
blk.60.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.60.attn_v.weightQ4_K[8192, 1024]
-
blk.60.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.60.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.61.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.attn_output.weightI8[8192, 8192]
-
blk.61.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.61.attn_v.weightQ4_K[8192, 1024]
-
blk.61.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.61.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.62.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.attn_output.weightI8[8192, 8192]
-
blk.62.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.62.attn_v.weightQ4_K[8192, 1024]
-
blk.62.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.62.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.63.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.attn_output.weightI8[8192, 8192]
-
blk.63.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.63.attn_v.weightQ4_K[8192, 1024]
-
blk.63.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.63.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.64.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.attn_output.weightI8[8192, 8192]
-
blk.64.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.64.attn_v.weightQ4_K[8192, 1024]
-
blk.64.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.64.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.65.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.attn_output.weightI8[8192, 8192]
-
blk.65.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.65.attn_v.weightQ4_K[8192, 1024]
-
blk.65.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.65.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.66.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.attn_output.weightI8[8192, 8192]
-
blk.66.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.66.attn_v.weightQ4_K[8192, 1024]
-
blk.66.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.66.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.67.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.attn_output.weightI8[8192, 8192]
-
blk.67.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.67.attn_v.weightQ4_K[8192, 1024]
-
blk.67.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.67.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.68.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.attn_output.weightI8[8192, 8192]
-
blk.68.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.68.attn_v.weightQ4_K[8192, 1024]
-
blk.68.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.68.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.69.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.attn_output.weightI8[8192, 8192]
-
blk.69.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.69.attn_v.weightQ4_K[8192, 1024]
-
blk.69.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.69.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.70.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.attn_output.weightI8[8192, 8192]
-
blk.70.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.70.attn_v.weightQ4_K[8192, 1024]
-
blk.70.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.70.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.71.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.attn_output.weightI8[8192, 8192]
-
blk.71.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.71.attn_v.weightQ4_K[8192, 1024]
-
blk.71.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.71.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.72.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.attn_output.weightI8[8192, 8192]
-
blk.72.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.72.attn_v.weightQ4_K[8192, 1024]
-
blk.72.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.72.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.73.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.attn_output.weightI8[8192, 8192]
-
blk.73.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.73.attn_v.weightQ4_K[8192, 1024]
-
blk.73.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.73.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.74.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.attn_output.weightI8[8192, 8192]
-
blk.74.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.74.attn_v.weightQ4_K[8192, 1024]
-
blk.74.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.74.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.75.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.attn_output.weightI8[8192, 8192]
-
blk.75.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.75.attn_v.weightQ4_K[8192, 1024]
-
blk.75.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.75.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.76.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.attn_output.weightI8[8192, 8192]
-
blk.76.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.76.attn_v.weightQ4_K[8192, 1024]
-
blk.76.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.76.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.77.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.attn_output.weightI8[8192, 8192]
-
blk.77.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.77.attn_v.weightQ4_K[8192, 1024]
-
blk.77.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.77.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.78.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.attn_output.weightI8[8192, 8192]
-
blk.78.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.78.attn_v.weightQ4_K[8192, 1024]
-
blk.78.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.78.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
blk.79.attn_k.weight(!unknown_type 29!)[8192, 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.attn_output.weightI8[8192, 8192]
-
blk.79.attn_q.weight(!unknown_type 29!)[8192, 8192]
-
blk.79.attn_v.weightQ4_K[8192, 1024]
-
blk.79.ffn_down.weight(!unknown_type 29!)[28672, 8192]
-
blk.79.ffn_gate.weight(!unknown_type 29!)[8192, 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.ffn_up.weight(!unknown_type 29!)[8192, 28672]
-
output.weightQ5_K[8192, 128256]
-
output_norm.weightF32[8192]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79