latest
40GB
The ollama model for the 4bit-quantized GGUF version of llama3-70b-chinese-chat (https://huggingface.co/shenzhi-wang/Llama3-70B-Chinese-Chat-GGUF-4bit).
70B
1,822 Pulls Updated 4 months ago
23cd31b73d5d · 40GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length8192
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ġ Ġ Ġ ĠĠĠ ĠĠ ĠĠ ĠĠĠ Ġ i n ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id128009
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_0[8192 128256]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_0[28672 8192]
-
blk.0.ffn_gate.weightQ4_0[8192 28672]
-
blk.0.ffn_up.weightQ4_0[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_0[8192 1024]
-
blk.0.attn_output.weightQ4_0[8192 8192]
-
blk.0.attn_q.weightQ4_0[8192 8192]
-
blk.0.attn_v.weightQ4_0[8192 1024]
-
blk.1.ffn_gate.weightQ4_0[8192 28672]
-
blk.1.attn_k.weightQ4_0[8192 1024]
-
blk.1.attn_output.weightQ4_0[8192 8192]
-
blk.1.attn_q.weightQ4_0[8192 8192]
-
blk.1.attn_v.weightQ4_0[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_0[28672 8192]
-
blk.1.ffn_up.weightQ4_0[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_0[28672 8192]
-
blk.2.ffn_gate.weightQ4_0[8192 28672]
-
blk.2.ffn_up.weightQ4_0[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ4_0[8192 1024]
-
blk.2.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_q.weightQ4_0[8192 8192]
-
blk.2.attn_v.weightQ4_0[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_0[28672 8192]
-
blk.3.ffn_gate.weightQ4_0[8192 28672]
-
blk.3.ffn_up.weightQ4_0[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ4_0[8192 1024]
-
blk.3.attn_output.weightQ4_0[8192 8192]
-
blk.3.attn_q.weightQ4_0[8192 8192]
-
blk.3.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_k.weightQ4_0[8192 1024]
-
blk.4.attn_output.weightQ4_0[8192 8192]
-
blk.4.attn_q.weightQ4_0[8192 8192]
-
blk.4.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_0[28672 8192]
-
blk.4.ffn_gate.weightQ4_0[8192 28672]
-
blk.4.ffn_up.weightQ4_0[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_0[28672 8192]
-
blk.5.ffn_gate.weightQ4_0[8192 28672]
-
blk.5.ffn_up.weightQ4_0[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.weightQ4_0[8192 1024]
-
blk.5.attn_output.weightQ4_0[8192 8192]
-
blk.5.attn_q.weightQ4_0[8192 8192]
-
blk.5.attn_v.weightQ4_0[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_0[28672 8192]
-
blk.6.ffn_gate.weightQ4_0[8192 28672]
-
blk.6.ffn_up.weightQ4_0[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightQ4_0[8192 1024]
-
blk.6.attn_output.weightQ4_0[8192 8192]
-
blk.6.attn_q.weightQ4_0[8192 8192]
-
blk.6.attn_v.weightQ4_0[8192 1024]
-
blk.7.attn_k.weightQ4_0[8192 1024]
-
blk.7.attn_q.weightQ4_0[8192 8192]
-
blk.7.attn_v.weightQ4_0[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_0[28672 8192]
-
blk.7.ffn_gate.weightQ4_0[8192 28672]
-
blk.7.ffn_up.weightQ4_0[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_0[28672 8192]
-
blk.8.ffn_gate.weightQ4_0[8192 28672]
-
blk.8.ffn_up.weightQ4_0[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightQ4_0[8192 1024]
-
blk.8.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_q.weightQ4_0[8192 8192]
-
blk.8.attn_v.weightQ4_0[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_0[28672 8192]
-
blk.9.ffn_gate.weightQ4_0[8192 28672]
-
blk.9.ffn_up.weightQ4_0[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_0[8192 1024]
-
blk.9.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_q.weightQ4_0[8192 8192]
-
blk.9.attn_v.weightQ4_0[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_0[28672 8192]
-
blk.10.ffn_gate.weightQ4_0[8192 28672]
-
blk.10.ffn_up.weightQ4_0[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ4_0[8192 1024]
-
blk.10.attn_output.weightQ4_0[8192 8192]
-
blk.10.attn_q.weightQ4_0[8192 8192]
-
blk.10.attn_v.weightQ4_0[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_0[28672 8192]
-
blk.11.ffn_gate.weightQ4_0[8192 28672]
-
blk.11.ffn_up.weightQ4_0[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ4_0[8192 1024]
-
blk.11.attn_output.weightQ4_0[8192 8192]
-
blk.11.attn_q.weightQ4_0[8192 8192]
-
blk.11.attn_v.weightQ4_0[8192 1024]
-
blk.12.ffn_gate.weightQ4_0[8192 28672]
-
blk.12.ffn_up.weightQ4_0[8192 28672]
-
blk.12.attn_k.weightQ4_0[8192 1024]
-
blk.12.attn_output.weightQ4_0[8192 8192]
-
blk.12.attn_q.weightQ4_0[8192 8192]
-
blk.12.attn_v.weightQ4_0[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_0[28672 8192]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_0[28672 8192]
-
blk.13.ffn_gate.weightQ4_0[8192 28672]
-
blk.13.ffn_up.weightQ4_0[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightQ4_0[8192 1024]
-
blk.13.attn_output.weightQ4_0[8192 8192]
-
blk.13.attn_q.weightQ4_0[8192 8192]
-
blk.13.attn_v.weightQ4_0[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_0[28672 8192]
-
blk.14.ffn_gate.weightQ4_0[8192 28672]
-
blk.14.ffn_up.weightQ4_0[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_0[8192 1024]
-
blk.14.attn_output.weightQ4_0[8192 8192]
-
blk.14.attn_q.weightQ4_0[8192 8192]
-
blk.14.attn_v.weightQ4_0[8192 1024]
-
blk.15.ffn_gate.weightQ4_0[8192 28672]
-
blk.15.attn_k.weightQ4_0[8192 1024]
-
blk.15.attn_output.weightQ4_0[8192 8192]
-
blk.15.attn_q.weightQ4_0[8192 8192]
-
blk.15.attn_v.weightQ4_0[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_0[28672 8192]
-
blk.15.ffn_up.weightQ4_0[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_0[28672 8192]
-
blk.16.ffn_gate.weightQ4_0[8192 28672]
-
blk.16.ffn_up.weightQ4_0[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightQ4_0[8192 1024]
-
blk.16.attn_output.weightQ4_0[8192 8192]
-
blk.16.attn_q.weightQ4_0[8192 8192]
-
blk.16.attn_v.weightQ4_0[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_0[28672 8192]
-
blk.17.ffn_gate.weightQ4_0[8192 28672]
-
blk.17.ffn_up.weightQ4_0[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ4_0[8192 1024]
-
blk.17.attn_output.weightQ4_0[8192 8192]
-
blk.17.attn_q.weightQ4_0[8192 8192]
-
blk.17.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_k.weightQ4_0[8192 1024]
-
blk.18.attn_output.weightQ4_0[8192 8192]
-
blk.18.attn_q.weightQ4_0[8192 8192]
-
blk.18.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_0[28672 8192]
-
blk.18.ffn_gate.weightQ4_0[8192 28672]
-
blk.18.ffn_up.weightQ4_0[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_0[28672 8192]
-
blk.19.ffn_gate.weightQ4_0[8192 28672]
-
blk.19.ffn_up.weightQ4_0[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightQ4_0[8192 1024]
-
blk.19.attn_output.weightQ4_0[8192 8192]
-
blk.19.attn_q.weightQ4_0[8192 8192]
-
blk.19.attn_v.weightQ4_0[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_0[28672 8192]
-
blk.20.ffn_gate.weightQ4_0[8192 28672]
-
blk.20.ffn_up.weightQ4_0[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ4_0[8192 1024]
-
blk.20.attn_output.weightQ4_0[8192 8192]
-
blk.20.attn_q.weightQ4_0[8192 8192]
-
blk.20.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_k.weightQ4_0[8192 1024]
-
blk.21.attn_q.weightQ4_0[8192 8192]
-
blk.21.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_0[28672 8192]
-
blk.21.ffn_gate.weightQ4_0[8192 28672]
-
blk.21.ffn_up.weightQ4_0[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_0[28672 8192]
-
blk.22.ffn_gate.weightQ4_0[8192 28672]
-
blk.22.ffn_up.weightQ4_0[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightQ4_0[8192 1024]
-
blk.22.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_q.weightQ4_0[8192 8192]
-
blk.22.attn_v.weightQ4_0[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_0[28672 8192]
-
blk.23.ffn_gate.weightQ4_0[8192 28672]
-
blk.23.ffn_up.weightQ4_0[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_0[8192 1024]
-
blk.23.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_q.weightQ4_0[8192 8192]
-
blk.23.attn_v.weightQ4_0[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_0[28672 8192]
-
blk.24.ffn_gate.weightQ4_0[8192 28672]
-
blk.24.ffn_up.weightQ4_0[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ4_0[8192 1024]
-
blk.24.attn_output.weightQ4_0[8192 8192]
-
blk.24.attn_q.weightQ4_0[8192 8192]
-
blk.24.attn_v.weightQ4_0[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_0[28672 8192]
-
blk.25.ffn_gate.weightQ4_0[8192 28672]
-
blk.25.ffn_up.weightQ4_0[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ4_0[8192 1024]
-
blk.25.attn_output.weightQ4_0[8192 8192]
-
blk.25.attn_q.weightQ4_0[8192 8192]
-
blk.25.attn_v.weightQ4_0[8192 1024]
-
blk.26.ffn_gate.weightQ4_0[8192 28672]
-
blk.26.ffn_up.weightQ4_0[8192 28672]
-
blk.26.attn_k.weightQ4_0[8192 1024]
-
blk.26.attn_output.weightQ4_0[8192 8192]
-
blk.26.attn_q.weightQ4_0[8192 8192]
-
blk.26.attn_v.weightQ4_0[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_0[28672 8192]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_0[28672 8192]
-
blk.27.ffn_gate.weightQ4_0[8192 28672]
-
blk.27.ffn_up.weightQ4_0[8192 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.weightQ4_0[8192 1024]
-
blk.27.attn_output.weightQ4_0[8192 8192]
-
blk.27.attn_q.weightQ4_0[8192 8192]
-
blk.27.attn_v.weightQ4_0[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_0[28672 8192]
-
blk.28.ffn_gate.weightQ4_0[8192 28672]
-
blk.28.ffn_up.weightQ4_0[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_0[8192 1024]
-
blk.28.attn_output.weightQ4_0[8192 8192]
-
blk.28.attn_q.weightQ4_0[8192 8192]
-
blk.28.attn_v.weightQ4_0[8192 1024]
-
blk.29.ffn_gate.weightQ4_0[8192 28672]
-
blk.29.attn_k.weightQ4_0[8192 1024]
-
blk.29.attn_output.weightQ4_0[8192 8192]
-
blk.29.attn_q.weightQ4_0[8192 8192]
-
blk.29.attn_v.weightQ4_0[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_0[28672 8192]
-
blk.29.ffn_up.weightQ4_0[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_0[28672 8192]
-
blk.30.ffn_gate.weightQ4_0[8192 28672]
-
blk.30.ffn_up.weightQ4_0[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightQ4_0[8192 1024]
-
blk.30.attn_output.weightQ4_0[8192 8192]
-
blk.30.attn_q.weightQ4_0[8192 8192]
-
blk.30.attn_v.weightQ4_0[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_0[28672 8192]
-
blk.31.ffn_gate.weightQ4_0[8192 28672]
-
blk.31.ffn_up.weightQ4_0[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ4_0[8192 1024]
-
blk.31.attn_output.weightQ4_0[8192 8192]
-
blk.31.attn_q.weightQ4_0[8192 8192]
-
blk.31.attn_v.weightQ4_0[8192 1024]
-
blk.32.attn_k.weightQ4_0[8192 1024]
-
blk.32.attn_output.weightQ4_0[8192 8192]
-
blk.32.attn_q.weightQ4_0[8192 8192]
-
blk.32.attn_v.weightQ4_0[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_0[28672 8192]
-
blk.32.ffn_gate.weightQ4_0[8192 28672]
-
blk.32.ffn_up.weightQ4_0[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_0[28672 8192]
-
blk.33.ffn_gate.weightQ4_0[8192 28672]
-
blk.33.ffn_up.weightQ4_0[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightQ4_0[8192 1024]
-
blk.33.attn_output.weightQ4_0[8192 8192]
-
blk.33.attn_q.weightQ4_0[8192 8192]
-
blk.33.attn_v.weightQ4_0[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_0[28672 8192]
-
blk.34.ffn_gate.weightQ4_0[8192 28672]
-
blk.34.ffn_up.weightQ4_0[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ4_0[8192 1024]
-
blk.34.attn_output.weightQ4_0[8192 8192]
-
blk.34.attn_q.weightQ4_0[8192 8192]
-
blk.34.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_k.weightQ4_0[8192 1024]
-
blk.35.attn_q.weightQ4_0[8192 8192]
-
blk.35.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_0[28672 8192]
-
blk.35.ffn_gate.weightQ4_0[8192 28672]
-
blk.35.ffn_up.weightQ4_0[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_0[28672 8192]
-
blk.36.ffn_gate.weightQ4_0[8192 28672]
-
blk.36.ffn_up.weightQ4_0[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightQ4_0[8192 1024]
-
blk.36.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_q.weightQ4_0[8192 8192]
-
blk.36.attn_v.weightQ4_0[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_0[28672 8192]
-
blk.37.ffn_gate.weightQ4_0[8192 28672]
-
blk.37.ffn_up.weightQ4_0[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ4_0[8192 1024]
-
blk.37.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_q.weightQ4_0[8192 8192]
-
blk.37.attn_v.weightQ4_0[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_0[28672 8192]
-
blk.38.ffn_gate.weightQ4_0[8192 28672]
-
blk.38.ffn_up.weightQ4_0[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ4_0[8192 1024]
-
blk.38.attn_output.weightQ4_0[8192 8192]
-
blk.38.attn_q.weightQ4_0[8192 8192]
-
blk.38.attn_v.weightQ4_0[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_0[28672 8192]
-
blk.39.ffn_gate.weightQ4_0[8192 28672]
-
blk.39.ffn_up.weightQ4_0[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_0[8192 1024]
-
blk.39.attn_output.weightQ4_0[8192 8192]
-
blk.39.attn_q.weightQ4_0[8192 8192]
-
blk.39.attn_v.weightQ4_0[8192 1024]
-
blk.40.ffn_gate.weightQ4_0[8192 28672]
-
blk.40.ffn_up.weightQ4_0[8192 28672]
-
blk.40.attn_k.weightQ4_0[8192 1024]
-
blk.40.attn_output.weightQ4_0[8192 8192]
-
blk.40.attn_q.weightQ4_0[8192 8192]
-
blk.40.attn_v.weightQ4_0[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_0[28672 8192]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_0[28672 8192]
-
blk.41.ffn_gate.weightQ4_0[8192 28672]
-
blk.41.ffn_up.weightQ4_0[8192 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.weightQ4_0[8192 1024]
-
blk.41.attn_output.weightQ4_0[8192 8192]
-
blk.41.attn_q.weightQ4_0[8192 8192]
-
blk.41.attn_v.weightQ4_0[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_0[28672 8192]
-
blk.42.ffn_gate.weightQ4_0[8192 28672]
-
blk.42.ffn_up.weightQ4_0[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ4_0[8192 1024]
-
blk.42.attn_output.weightQ4_0[8192 8192]
-
blk.42.attn_q.weightQ4_0[8192 8192]
-
blk.42.attn_v.weightQ4_0[8192 1024]
-
blk.43.ffn_gate.weightQ4_0[8192 28672]
-
blk.43.attn_k.weightQ4_0[8192 1024]
-
blk.43.attn_output.weightQ4_0[8192 8192]
-
blk.43.attn_q.weightQ4_0[8192 8192]
-
blk.43.attn_v.weightQ4_0[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_0[28672 8192]
-
blk.43.ffn_up.weightQ4_0[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_0[28672 8192]
-
blk.44.ffn_gate.weightQ4_0[8192 28672]
-
blk.44.ffn_up.weightQ4_0[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightQ4_0[8192 1024]
-
blk.44.attn_output.weightQ4_0[8192 8192]
-
blk.44.attn_q.weightQ4_0[8192 8192]
-
blk.44.attn_v.weightQ4_0[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_0[28672 8192]
-
blk.45.ffn_gate.weightQ4_0[8192 28672]
-
blk.45.ffn_up.weightQ4_0[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ4_0[8192 1024]
-
blk.45.attn_output.weightQ4_0[8192 8192]
-
blk.45.attn_q.weightQ4_0[8192 8192]
-
blk.45.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_k.weightQ4_0[8192 1024]
-
blk.46.attn_output.weightQ4_0[8192 8192]
-
blk.46.attn_q.weightQ4_0[8192 8192]
-
blk.46.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_0[28672 8192]
-
blk.46.ffn_gate.weightQ4_0[8192 28672]
-
blk.46.ffn_up.weightQ4_0[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_0[28672 8192]
-
blk.47.ffn_gate.weightQ4_0[8192 28672]
-
blk.47.ffn_up.weightQ4_0[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightQ4_0[8192 1024]
-
blk.47.attn_output.weightQ4_0[8192 8192]
-
blk.47.attn_q.weightQ4_0[8192 8192]
-
blk.47.attn_v.weightQ4_0[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ4_0[28672 8192]
-
blk.48.ffn_gate.weightQ4_0[8192 28672]
-
blk.48.ffn_up.weightQ4_0[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightQ4_0[8192 1024]
-
blk.48.attn_output.weightQ4_0[8192 8192]
-
blk.48.attn_q.weightQ4_0[8192 8192]
-
blk.48.attn_v.weightQ4_0[8192 1024]
-
blk.49.attn_k.weightQ4_0[8192 1024]
-
blk.49.attn_q.weightQ4_0[8192 8192]
-
blk.49.attn_v.weightQ4_0[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ4_0[28672 8192]
-
blk.49.ffn_gate.weightQ4_0[8192 28672]
-
blk.49.ffn_up.weightQ4_0[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_output.weightQ4_0[8192 8192]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightQ4_0[28672 8192]
-
blk.50.ffn_gate.weightQ4_0[8192 28672]
-
blk.50.ffn_up.weightQ4_0[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_k.weightQ4_0[8192 1024]
-
blk.50.attn_output.weightQ4_0[8192 8192]
-
blk.50.attn_q.weightQ4_0[8192 8192]
-
blk.50.attn_v.weightQ4_0[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ4_0[28672 8192]
-
blk.51.ffn_gate.weightQ4_0[8192 28672]
-
blk.51.ffn_up.weightQ4_0[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightQ4_0[8192 1024]
-
blk.51.attn_output.weightQ4_0[8192 8192]
-
blk.51.attn_q.weightQ4_0[8192 8192]
-
blk.51.attn_v.weightQ4_0[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ4_0[28672 8192]
-
blk.52.ffn_gate.weightQ4_0[8192 28672]
-
blk.52.ffn_up.weightQ4_0[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightQ4_0[8192 1024]
-
blk.52.attn_output.weightQ4_0[8192 8192]
-
blk.52.attn_q.weightQ4_0[8192 8192]
-
blk.52.attn_v.weightQ4_0[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightQ4_0[28672 8192]
-
blk.53.ffn_gate.weightQ4_0[8192 28672]
-
blk.53.ffn_up.weightQ4_0[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightQ4_0[8192 1024]
-
blk.53.attn_output.weightQ4_0[8192 8192]
-
blk.53.attn_q.weightQ4_0[8192 8192]
-
blk.53.attn_v.weightQ4_0[8192 1024]
-
blk.54.ffn_gate.weightQ4_0[8192 28672]
-
blk.54.ffn_up.weightQ4_0[8192 28672]
-
blk.54.attn_k.weightQ4_0[8192 1024]
-
blk.54.attn_output.weightQ4_0[8192 8192]
-
blk.54.attn_q.weightQ4_0[8192 8192]
-
blk.54.attn_v.weightQ4_0[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ4_0[28672 8192]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ4_0[28672 8192]
-
blk.55.ffn_gate.weightQ4_0[8192 28672]
-
blk.55.ffn_up.weightQ4_0[8192 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.weightQ4_0[8192 1024]
-
blk.55.attn_output.weightQ4_0[8192 8192]
-
blk.55.attn_q.weightQ4_0[8192 8192]
-
blk.55.attn_v.weightQ4_0[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightQ4_0[28672 8192]
-
blk.56.ffn_gate.weightQ4_0[8192 28672]
-
blk.56.ffn_up.weightQ4_0[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightQ4_0[8192 1024]
-
blk.56.attn_output.weightQ4_0[8192 8192]
-
blk.56.attn_q.weightQ4_0[8192 8192]
-
blk.56.attn_v.weightQ4_0[8192 1024]
-
blk.57.ffn_gate.weightQ4_0[8192 28672]
-
blk.57.attn_k.weightQ4_0[8192 1024]
-
blk.57.attn_output.weightQ4_0[8192 8192]
-
blk.57.attn_q.weightQ4_0[8192 8192]
-
blk.57.attn_v.weightQ4_0[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightQ4_0[28672 8192]
-
blk.57.ffn_up.weightQ4_0[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ4_0[28672 8192]
-
blk.58.ffn_gate.weightQ4_0[8192 28672]
-
blk.58.ffn_up.weightQ4_0[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.weightQ4_0[8192 1024]
-
blk.58.attn_output.weightQ4_0[8192 8192]
-
blk.58.attn_q.weightQ4_0[8192 8192]
-
blk.58.attn_v.weightQ4_0[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightQ4_0[28672 8192]
-
blk.59.ffn_gate.weightQ4_0[8192 28672]
-
blk.59.ffn_up.weightQ4_0[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightQ4_0[8192 1024]
-
blk.59.attn_output.weightQ4_0[8192 8192]
-
blk.59.attn_q.weightQ4_0[8192 8192]
-
blk.59.attn_v.weightQ4_0[8192 1024]
-
blk.60.attn_k.weightQ4_0[8192 1024]
-
blk.60.attn_output.weightQ4_0[8192 8192]
-
blk.60.attn_q.weightQ4_0[8192 8192]
-
blk.60.attn_v.weightQ4_0[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ4_0[28672 8192]
-
blk.60.ffn_gate.weightQ4_0[8192 28672]
-
blk.60.ffn_up.weightQ4_0[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ4_0[28672 8192]
-
blk.61.ffn_gate.weightQ4_0[8192 28672]
-
blk.61.ffn_up.weightQ4_0[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_k.weightQ4_0[8192 1024]
-
blk.61.attn_output.weightQ4_0[8192 8192]
-
blk.61.attn_q.weightQ4_0[8192 8192]
-
blk.61.attn_v.weightQ4_0[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ4_0[28672 8192]
-
blk.62.ffn_gate.weightQ4_0[8192 28672]
-
blk.62.ffn_up.weightQ4_0[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightQ4_0[8192 1024]
-
blk.62.attn_output.weightQ4_0[8192 8192]
-
blk.62.attn_q.weightQ4_0[8192 8192]
-
blk.62.attn_v.weightQ4_0[8192 1024]
-
blk.63.attn_k.weightQ4_0[8192 1024]
-
blk.63.attn_q.weightQ4_0[8192 8192]
-
blk.63.attn_v.weightQ4_0[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ4_0[28672 8192]
-
blk.63.ffn_gate.weightQ4_0[8192 28672]
-
blk.63.ffn_up.weightQ4_0[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_output.weightQ4_0[8192 8192]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ4_0[28672 8192]
-
blk.64.ffn_gate.weightQ4_0[8192 28672]
-
blk.64.ffn_up.weightQ4_0[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.weightQ4_0[8192 1024]
-
blk.64.attn_output.weightQ4_0[8192 8192]
-
blk.64.attn_q.weightQ4_0[8192 8192]
-
blk.64.attn_v.weightQ4_0[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ4_0[28672 8192]
-
blk.65.ffn_gate.weightQ4_0[8192 28672]
-
blk.65.ffn_up.weightQ4_0[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightQ4_0[8192 1024]
-
blk.65.attn_output.weightQ4_0[8192 8192]
-
blk.65.attn_q.weightQ4_0[8192 8192]
-
blk.65.attn_v.weightQ4_0[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ4_0[28672 8192]
-
blk.66.ffn_gate.weightQ4_0[8192 28672]
-
blk.66.ffn_up.weightQ4_0[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightQ4_0[8192 1024]
-
blk.66.attn_output.weightQ4_0[8192 8192]
-
blk.66.attn_q.weightQ4_0[8192 8192]
-
blk.66.attn_v.weightQ4_0[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ4_0[28672 8192]
-
blk.67.ffn_gate.weightQ4_0[8192 28672]
-
blk.67.ffn_up.weightQ4_0[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightQ4_0[8192 1024]
-
blk.67.attn_output.weightQ4_0[8192 8192]
-
blk.67.attn_q.weightQ4_0[8192 8192]
-
blk.67.attn_v.weightQ4_0[8192 1024]
-
blk.68.ffn_gate.weightQ4_0[8192 28672]
-
blk.68.ffn_up.weightQ4_0[8192 28672]
-
blk.68.attn_k.weightQ4_0[8192 1024]
-
blk.68.attn_output.weightQ4_0[8192 8192]
-
blk.68.attn_q.weightQ4_0[8192 8192]
-
blk.68.attn_v.weightQ4_0[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightQ4_0[28672 8192]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ4_0[28672 8192]
-
blk.69.ffn_gate.weightQ4_0[8192 28672]
-
blk.69.ffn_up.weightQ4_0[8192 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.weightQ4_0[8192 1024]
-
blk.69.attn_output.weightQ4_0[8192 8192]
-
blk.69.attn_q.weightQ4_0[8192 8192]
-
blk.69.attn_v.weightQ4_0[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ4_0[28672 8192]
-
blk.70.ffn_gate.weightQ4_0[8192 28672]
-
blk.70.ffn_up.weightQ4_0[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightQ4_0[8192 1024]
-
blk.70.attn_output.weightQ4_0[8192 8192]
-
blk.70.attn_q.weightQ4_0[8192 8192]
-
blk.70.attn_v.weightQ4_0[8192 1024]
-
blk.71.ffn_gate.weightQ4_0[8192 28672]
-
blk.71.attn_k.weightQ4_0[8192 1024]
-
blk.71.attn_output.weightQ4_0[8192 8192]
-
blk.71.attn_q.weightQ4_0[8192 8192]
-
blk.71.attn_v.weightQ4_0[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ4_0[28672 8192]
-
blk.71.ffn_up.weightQ4_0[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ4_0[28672 8192]
-
blk.72.ffn_gate.weightQ4_0[8192 28672]
-
blk.72.ffn_up.weightQ4_0[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.weightQ4_0[8192 1024]
-
blk.72.attn_output.weightQ4_0[8192 8192]
-
blk.72.attn_q.weightQ4_0[8192 8192]
-
blk.72.attn_v.weightQ4_0[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ4_0[28672 8192]
-
blk.73.ffn_gate.weightQ4_0[8192 28672]
-
blk.73.ffn_up.weightQ4_0[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightQ4_0[8192 1024]
-
blk.73.attn_output.weightQ4_0[8192 8192]
-
blk.73.attn_q.weightQ4_0[8192 8192]
-
blk.73.attn_v.weightQ4_0[8192 1024]
-
blk.74.attn_k.weightQ4_0[8192 1024]
-
blk.74.attn_output.weightQ4_0[8192 8192]
-
blk.74.attn_q.weightQ4_0[8192 8192]
-
blk.74.attn_v.weightQ4_0[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ4_0[28672 8192]
-
blk.74.ffn_gate.weightQ4_0[8192 28672]
-
blk.74.ffn_up.weightQ4_0[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ4_0[28672 8192]
-
blk.75.ffn_gate.weightQ4_0[8192 28672]
-
blk.75.ffn_up.weightQ4_0[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.attn_k.weightQ4_0[8192 1024]
-
blk.75.attn_output.weightQ4_0[8192 8192]
-
blk.75.attn_q.weightQ4_0[8192 8192]
-
blk.75.attn_v.weightQ4_0[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ4_0[28672 8192]
-
blk.76.ffn_gate.weightQ4_0[8192 28672]
-
blk.76.ffn_up.weightQ4_0[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightQ4_0[8192 1024]
-
blk.76.attn_output.weightQ4_0[8192 8192]
-
blk.76.attn_q.weightQ4_0[8192 8192]
-
blk.76.attn_v.weightQ4_0[8192 1024]
-
blk.77.attn_k.weightQ4_0[8192 1024]
-
blk.77.attn_q.weightQ4_0[8192 8192]
-
blk.77.attn_v.weightQ4_0[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ4_0[28672 8192]
-
blk.77.ffn_gate.weightQ4_0[8192 28672]
-
blk.77.ffn_up.weightQ4_0[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_output.weightQ4_0[8192 8192]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightQ4_0[28672 8192]
-
blk.78.ffn_gate.weightQ4_0[8192 28672]
-
blk.78.ffn_up.weightQ4_0[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_k.weightQ4_0[8192 1024]
-
blk.78.attn_output.weightQ4_0[8192 8192]
-
blk.78.attn_q.weightQ4_0[8192 8192]
-
blk.78.attn_v.weightQ4_0[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ4_0[28672 8192]
-
blk.79.ffn_gate.weightQ4_0[8192 28672]
-
blk.79.ffn_up.weightQ4_0[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightQ4_0[8192 1024]
-
blk.79.attn_output.weightQ4_0[8192 8192]
-
blk.79.attn_q.weightQ4_0[8192 8192]
-
blk.79.attn_v.weightQ4_0[8192 1024]
-
output_norm.weightF32[8192]
-
output.weightQ6_K[8192 128256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79