https://huggingface.co/SakuraLLM/GalTransl-7B-v2
25 Pulls Updated 7 weeks ago
8749e704993a · 4.3GB
-
general.architectureqwen2
-
general.basenameGaltransl
-
general.file_type30
-
general.nameGaltransl 7B v2
-
general.quantization_version2
-
general.size_label7B
-
general.typemodel
-
general.versionv2
-
quantize.imatrix.chunks_count554
-
quantize.imatrix.datasetE:\imatrix.txt
-
quantize.imatrix.entries_count224
-
quantize.imatrix.fileE:\Galtransl-7B-v2\imatrix.dat
-
qwen2.attention.head_count32
-
qwen2.attention.head_count_kv32
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count32
-
qwen2.context_length32768
-
qwen2.embedding_length4096
-
qwen2.feed_forward_length11008
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ, ĠĠ ĠĠ, i n, Ġ t, ĠĠĠĠ ĠĠĠĠ, ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151645
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1, 1, 1, 1, 1, ...]
-
tokenizer.ggml.tokens[!, ", #, $, %, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[4096, 151936]
-
blk.0.attn_k.biasF32[4096]
-
blk.0.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_q.biasF32[4096]
-
blk.0.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.attn_v.biasF32[4096]
-
blk.0.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.0.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.1.attn_k.biasF32[4096]
-
blk.1.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_q.biasF32[4096]
-
blk.1.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.attn_v.biasF32[4096]
-
blk.1.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.1.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.2.attn_k.biasF32[4096]
-
blk.2.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_q.biasF32[4096]
-
blk.2.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.attn_v.biasF32[4096]
-
blk.2.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.2.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.3.attn_k.biasF32[4096]
-
blk.3.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_q.biasF32[4096]
-
blk.3.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.attn_v.biasF32[4096]
-
blk.3.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.3.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.4.attn_k.biasF32[4096]
-
blk.4.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_q.biasF32[4096]
-
blk.4.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.attn_v.biasF32[4096]
-
blk.4.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.4.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.5.attn_k.biasF32[4096]
-
blk.5.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_q.biasF32[4096]
-
blk.5.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.attn_v.biasF32[4096]
-
blk.5.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.5.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.6.attn_k.biasF32[4096]
-
blk.6.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_q.biasF32[4096]
-
blk.6.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.attn_v.biasF32[4096]
-
blk.6.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.6.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.7.attn_k.biasF32[4096]
-
blk.7.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_q.biasF32[4096]
-
blk.7.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.attn_v.biasF32[4096]
-
blk.7.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.7.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.8.attn_k.biasF32[4096]
-
blk.8.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_q.biasF32[4096]
-
blk.8.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.attn_v.biasF32[4096]
-
blk.8.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.8.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.9.attn_k.biasF32[4096]
-
blk.9.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_q.biasF32[4096]
-
blk.9.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.attn_v.biasF32[4096]
-
blk.9.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.9.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.10.attn_k.biasF32[4096]
-
blk.10.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_q.biasF32[4096]
-
blk.10.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.attn_v.biasF32[4096]
-
blk.10.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.10.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.11.attn_k.biasF32[4096]
-
blk.11.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_q.biasF32[4096]
-
blk.11.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.attn_v.biasF32[4096]
-
blk.11.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.11.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.12.attn_k.biasF32[4096]
-
blk.12.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_q.biasF32[4096]
-
blk.12.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.attn_v.biasF32[4096]
-
blk.12.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.12.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.13.attn_k.biasF32[4096]
-
blk.13.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_q.biasF32[4096]
-
blk.13.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.attn_v.biasF32[4096]
-
blk.13.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.13.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.14.attn_k.biasF32[4096]
-
blk.14.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_q.biasF32[4096]
-
blk.14.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.attn_v.biasF32[4096]
-
blk.14.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.14.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.15.attn_k.biasF32[4096]
-
blk.15.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_q.biasF32[4096]
-
blk.15.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.attn_v.biasF32[4096]
-
blk.15.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.15.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.16.attn_k.biasF32[4096]
-
blk.16.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_q.biasF32[4096]
-
blk.16.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.attn_v.biasF32[4096]
-
blk.16.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.16.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.17.attn_k.biasF32[4096]
-
blk.17.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_q.biasF32[4096]
-
blk.17.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.attn_v.biasF32[4096]
-
blk.17.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.17.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.18.attn_k.biasF32[4096]
-
blk.18.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_q.biasF32[4096]
-
blk.18.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.attn_v.biasF32[4096]
-
blk.18.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.18.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.19.attn_k.biasF32[4096]
-
blk.19.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_q.biasF32[4096]
-
blk.19.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.attn_v.biasF32[4096]
-
blk.19.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.19.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.20.attn_k.biasF32[4096]
-
blk.20.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_q.biasF32[4096]
-
blk.20.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.attn_v.biasF32[4096]
-
blk.20.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.20.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.21.attn_k.biasF32[4096]
-
blk.21.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_q.biasF32[4096]
-
blk.21.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.attn_v.biasF32[4096]
-
blk.21.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.21.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.22.attn_k.biasF32[4096]
-
blk.22.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_q.biasF32[4096]
-
blk.22.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.attn_v.biasF32[4096]
-
blk.22.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.22.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.23.attn_k.biasF32[4096]
-
blk.23.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_q.biasF32[4096]
-
blk.23.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.attn_v.biasF32[4096]
-
blk.23.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.23.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.24.attn_k.biasF32[4096]
-
blk.24.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_q.biasF32[4096]
-
blk.24.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.attn_v.biasF32[4096]
-
blk.24.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.24.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.25.attn_k.biasF32[4096]
-
blk.25.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_q.biasF32[4096]
-
blk.25.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.attn_v.biasF32[4096]
-
blk.25.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.25.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.26.attn_k.biasF32[4096]
-
blk.26.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_q.biasF32[4096]
-
blk.26.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.attn_v.biasF32[4096]
-
blk.26.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.26.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.27.attn_k.biasF32[4096]
-
blk.27.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_q.biasF32[4096]
-
blk.27.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.attn_v.biasF32[4096]
-
blk.27.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.27.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.28.attn_k.biasF32[4096]
-
blk.28.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_q.biasF32[4096]
-
blk.28.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.attn_v.biasF32[4096]
-
blk.28.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.28.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.29.attn_k.biasF32[4096]
-
blk.29.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_q.biasF32[4096]
-
blk.29.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.attn_v.biasF32[4096]
-
blk.29.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.29.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.30.attn_k.biasF32[4096]
-
blk.30.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_q.biasF32[4096]
-
blk.30.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.attn_v.biasF32[4096]
-
blk.30.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.30.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
blk.31.attn_k.biasF32[4096]
-
blk.31.attn_k.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_q.biasF32[4096]
-
blk.31.attn_q.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.attn_v.biasF32[4096]
-
blk.31.attn_v.weight(!unknown_type 23!)[4096, 4096]
-
blk.31.ffn_down.weight(!unknown_type 23!)[11008, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[4096, 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 23!)[4096, 11008]
-
output.weightQ6_K[4096, 151936]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31