latest
37GB
35B
26 Pulls Updated 3 months ago
0f8bf723debd · 37GB
-
quantize.imatrix.chunks_count95
-
quantize.imatrix.dataset/training_data/groups_merged.txt
-
quantize.imatrix.entries_count280
-
quantize.imatrix.file/models/35b-beta-long-GGUF/35b-beta-long.imatrix
-
general.architecturecommand-r
-
general.file_typeQ8_0
-
command-r.attention.head_count64
-
command-r.attention.head_count_kv64
-
command-r.attention.layer_norm_epsilon1e-05
-
command-r.attention.layer_norm_rms_epsilon1e-05
-
command-r.block_count40
-
command-r.context_length128000
-
command-r.embedding_length8192
-
command-r.feed_forward_length22528
-
command-r.logit_scale0.0625
-
command-r.rope.freq_base8e+06
-
command-r.rope.scaling.typenone
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id5
-
tokenizer.ggml.eos_token_id6
-
tokenizer.ggml.merges[Ġ Ġ Ġ t e r i n Ġ a ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.precommand-r
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<PAD> <UNK> <CLS> <SEP> <MASK_TOKEN> ...]
-
NameTypeShape
-
token_embd.weightQ8_0[8192 256000]
-
blk.0.attn_k.weightQ8_0[8192 8192]
-
blk.0.attn_output.weightQ8_0[8192 8192]
-
blk.0.attn_q.weightQ8_0[8192 8192]
-
blk.0.attn_v.weightQ8_0[8192 8192]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ8_0[22528 8192]
-
blk.0.ffn_gate.weightQ8_0[8192 22528]
-
blk.0.ffn_up.weightQ8_0[8192 22528]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ8_0[22528 8192]
-
blk.1.ffn_gate.weightQ8_0[8192 22528]
-
blk.1.ffn_up.weightQ8_0[8192 22528]
-
blk.1.attn_k.weightQ8_0[8192 8192]
-
blk.1.attn_output.weightQ8_0[8192 8192]
-
blk.1.attn_q.weightQ8_0[8192 8192]
-
blk.1.attn_v.weightQ8_0[8192 8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ8_0[22528 8192]
-
blk.2.ffn_gate.weightQ8_0[8192 22528]
-
blk.2.ffn_up.weightQ8_0[8192 22528]
-
blk.2.attn_k.weightQ8_0[8192 8192]
-
blk.2.attn_output.weightQ8_0[8192 8192]
-
blk.2.attn_q.weightQ8_0[8192 8192]
-
blk.2.attn_v.weightQ8_0[8192 8192]
-
blk.3.attn_k.weightQ8_0[8192 8192]
-
blk.3.attn_output.weightQ8_0[8192 8192]
-
blk.3.attn_q.weightQ8_0[8192 8192]
-
blk.3.attn_v.weightQ8_0[8192 8192]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ8_0[22528 8192]
-
blk.3.ffn_gate.weightQ8_0[8192 22528]
-
blk.3.ffn_up.weightQ8_0[8192 22528]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ8_0[22528 8192]
-
blk.4.ffn_gate.weightQ8_0[8192 22528]
-
blk.4.ffn_up.weightQ8_0[8192 22528]
-
blk.4.attn_k.weightQ8_0[8192 8192]
-
blk.4.attn_output.weightQ8_0[8192 8192]
-
blk.4.attn_q.weightQ8_0[8192 8192]
-
blk.4.attn_v.weightQ8_0[8192 8192]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ8_0[22528 8192]
-
blk.5.ffn_gate.weightQ8_0[8192 22528]
-
blk.5.ffn_up.weightQ8_0[8192 22528]
-
blk.5.attn_k.weightQ8_0[8192 8192]
-
blk.5.attn_output.weightQ8_0[8192 8192]
-
blk.5.attn_q.weightQ8_0[8192 8192]
-
blk.5.attn_v.weightQ8_0[8192 8192]
-
blk.6.attn_k.weightQ8_0[8192 8192]
-
blk.6.attn_output.weightQ8_0[8192 8192]
-
blk.6.attn_q.weightQ8_0[8192 8192]
-
blk.6.attn_v.weightQ8_0[8192 8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ8_0[22528 8192]
-
blk.6.ffn_gate.weightQ8_0[8192 22528]
-
blk.6.ffn_up.weightQ8_0[8192 22528]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ8_0[22528 8192]
-
blk.7.ffn_gate.weightQ8_0[8192 22528]
-
blk.7.ffn_up.weightQ8_0[8192 22528]
-
blk.7.attn_k.weightQ8_0[8192 8192]
-
blk.7.attn_output.weightQ8_0[8192 8192]
-
blk.7.attn_q.weightQ8_0[8192 8192]
-
blk.7.attn_v.weightQ8_0[8192 8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ8_0[22528 8192]
-
blk.8.ffn_gate.weightQ8_0[8192 22528]
-
blk.8.ffn_up.weightQ8_0[8192 22528]
-
blk.8.attn_k.weightQ8_0[8192 8192]
-
blk.8.attn_output.weightQ8_0[8192 8192]
-
blk.8.attn_q.weightQ8_0[8192 8192]
-
blk.8.attn_v.weightQ8_0[8192 8192]
-
blk.9.attn_k.weightQ8_0[8192 8192]
-
blk.9.attn_output.weightQ8_0[8192 8192]
-
blk.9.attn_q.weightQ8_0[8192 8192]
-
blk.9.attn_v.weightQ8_0[8192 8192]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ8_0[22528 8192]
-
blk.9.ffn_gate.weightQ8_0[8192 22528]
-
blk.9.ffn_up.weightQ8_0[8192 22528]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ8_0[22528 8192]
-
blk.10.ffn_gate.weightQ8_0[8192 22528]
-
blk.10.ffn_up.weightQ8_0[8192 22528]
-
blk.10.attn_k.weightQ8_0[8192 8192]
-
blk.10.attn_output.weightQ8_0[8192 8192]
-
blk.10.attn_q.weightQ8_0[8192 8192]
-
blk.10.attn_v.weightQ8_0[8192 8192]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ8_0[22528 8192]
-
blk.11.ffn_gate.weightQ8_0[8192 22528]
-
blk.11.ffn_up.weightQ8_0[8192 22528]
-
blk.11.attn_k.weightQ8_0[8192 8192]
-
blk.11.attn_output.weightQ8_0[8192 8192]
-
blk.11.attn_q.weightQ8_0[8192 8192]
-
blk.11.attn_v.weightQ8_0[8192 8192]
-
blk.12.attn_k.weightQ8_0[8192 8192]
-
blk.12.attn_output.weightQ8_0[8192 8192]
-
blk.12.attn_q.weightQ8_0[8192 8192]
-
blk.12.attn_v.weightQ8_0[8192 8192]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ8_0[22528 8192]
-
blk.12.ffn_gate.weightQ8_0[8192 22528]
-
blk.12.ffn_up.weightQ8_0[8192 22528]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ8_0[22528 8192]
-
blk.13.ffn_gate.weightQ8_0[8192 22528]
-
blk.13.ffn_up.weightQ8_0[8192 22528]
-
blk.13.attn_k.weightQ8_0[8192 8192]
-
blk.13.attn_output.weightQ8_0[8192 8192]
-
blk.13.attn_q.weightQ8_0[8192 8192]
-
blk.13.attn_v.weightQ8_0[8192 8192]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ8_0[22528 8192]
-
blk.14.ffn_gate.weightQ8_0[8192 22528]
-
blk.14.ffn_up.weightQ8_0[8192 22528]
-
blk.14.attn_k.weightQ8_0[8192 8192]
-
blk.14.attn_output.weightQ8_0[8192 8192]
-
blk.14.attn_q.weightQ8_0[8192 8192]
-
blk.14.attn_v.weightQ8_0[8192 8192]
-
blk.15.attn_k.weightQ8_0[8192 8192]
-
blk.15.attn_output.weightQ8_0[8192 8192]
-
blk.15.attn_q.weightQ8_0[8192 8192]
-
blk.15.attn_v.weightQ8_0[8192 8192]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ8_0[22528 8192]
-
blk.15.ffn_gate.weightQ8_0[8192 22528]
-
blk.15.ffn_up.weightQ8_0[8192 22528]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ8_0[22528 8192]
-
blk.16.ffn_gate.weightQ8_0[8192 22528]
-
blk.16.ffn_up.weightQ8_0[8192 22528]
-
blk.16.attn_k.weightQ8_0[8192 8192]
-
blk.16.attn_output.weightQ8_0[8192 8192]
-
blk.16.attn_q.weightQ8_0[8192 8192]
-
blk.16.attn_v.weightQ8_0[8192 8192]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ8_0[22528 8192]
-
blk.17.ffn_gate.weightQ8_0[8192 22528]
-
blk.17.ffn_up.weightQ8_0[8192 22528]
-
blk.17.attn_k.weightQ8_0[8192 8192]
-
blk.17.attn_output.weightQ8_0[8192 8192]
-
blk.17.attn_q.weightQ8_0[8192 8192]
-
blk.17.attn_v.weightQ8_0[8192 8192]
-
blk.18.attn_k.weightQ8_0[8192 8192]
-
blk.18.attn_output.weightQ8_0[8192 8192]
-
blk.18.attn_q.weightQ8_0[8192 8192]
-
blk.18.attn_v.weightQ8_0[8192 8192]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ8_0[22528 8192]
-
blk.18.ffn_gate.weightQ8_0[8192 22528]
-
blk.18.ffn_up.weightQ8_0[8192 22528]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ8_0[22528 8192]
-
blk.19.ffn_gate.weightQ8_0[8192 22528]
-
blk.19.ffn_up.weightQ8_0[8192 22528]
-
blk.19.attn_k.weightQ8_0[8192 8192]
-
blk.19.attn_output.weightQ8_0[8192 8192]
-
blk.19.attn_q.weightQ8_0[8192 8192]
-
blk.19.attn_v.weightQ8_0[8192 8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ8_0[22528 8192]
-
blk.20.ffn_gate.weightQ8_0[8192 22528]
-
blk.20.ffn_up.weightQ8_0[8192 22528]
-
blk.20.attn_k.weightQ8_0[8192 8192]
-
blk.20.attn_output.weightQ8_0[8192 8192]
-
blk.20.attn_q.weightQ8_0[8192 8192]
-
blk.20.attn_v.weightQ8_0[8192 8192]
-
blk.21.attn_k.weightQ8_0[8192 8192]
-
blk.21.attn_output.weightQ8_0[8192 8192]
-
blk.21.attn_q.weightQ8_0[8192 8192]
-
blk.21.attn_v.weightQ8_0[8192 8192]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ8_0[22528 8192]
-
blk.21.ffn_gate.weightQ8_0[8192 22528]
-
blk.21.ffn_up.weightQ8_0[8192 22528]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ8_0[22528 8192]
-
blk.22.ffn_gate.weightQ8_0[8192 22528]
-
blk.22.ffn_up.weightQ8_0[8192 22528]
-
blk.22.attn_k.weightQ8_0[8192 8192]
-
blk.22.attn_output.weightQ8_0[8192 8192]
-
blk.22.attn_q.weightQ8_0[8192 8192]
-
blk.22.attn_v.weightQ8_0[8192 8192]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ8_0[22528 8192]
-
blk.23.ffn_gate.weightQ8_0[8192 22528]
-
blk.23.ffn_up.weightQ8_0[8192 22528]
-
blk.23.attn_k.weightQ8_0[8192 8192]
-
blk.23.attn_output.weightQ8_0[8192 8192]
-
blk.23.attn_q.weightQ8_0[8192 8192]
-
blk.23.attn_v.weightQ8_0[8192 8192]
-
blk.24.attn_k.weightQ8_0[8192 8192]
-
blk.24.attn_output.weightQ8_0[8192 8192]
-
blk.24.attn_q.weightQ8_0[8192 8192]
-
blk.24.attn_v.weightQ8_0[8192 8192]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ8_0[22528 8192]
-
blk.24.ffn_gate.weightQ8_0[8192 22528]
-
blk.24.ffn_up.weightQ8_0[8192 22528]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ8_0[22528 8192]
-
blk.25.ffn_gate.weightQ8_0[8192 22528]
-
blk.25.ffn_up.weightQ8_0[8192 22528]
-
blk.25.attn_k.weightQ8_0[8192 8192]
-
blk.25.attn_output.weightQ8_0[8192 8192]
-
blk.25.attn_q.weightQ8_0[8192 8192]
-
blk.25.attn_v.weightQ8_0[8192 8192]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ8_0[22528 8192]
-
blk.26.ffn_gate.weightQ8_0[8192 22528]
-
blk.26.ffn_up.weightQ8_0[8192 22528]
-
blk.26.attn_k.weightQ8_0[8192 8192]
-
blk.26.attn_output.weightQ8_0[8192 8192]
-
blk.26.attn_q.weightQ8_0[8192 8192]
-
blk.26.attn_v.weightQ8_0[8192 8192]
-
blk.27.attn_k.weightQ8_0[8192 8192]
-
blk.27.attn_output.weightQ8_0[8192 8192]
-
blk.27.attn_q.weightQ8_0[8192 8192]
-
blk.27.attn_v.weightQ8_0[8192 8192]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ8_0[22528 8192]
-
blk.27.ffn_gate.weightQ8_0[8192 22528]
-
blk.27.ffn_up.weightQ8_0[8192 22528]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ8_0[22528 8192]
-
blk.28.ffn_gate.weightQ8_0[8192 22528]
-
blk.28.ffn_up.weightQ8_0[8192 22528]
-
blk.28.attn_k.weightQ8_0[8192 8192]
-
blk.28.attn_output.weightQ8_0[8192 8192]
-
blk.28.attn_q.weightQ8_0[8192 8192]
-
blk.28.attn_v.weightQ8_0[8192 8192]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ8_0[22528 8192]
-
blk.29.ffn_gate.weightQ8_0[8192 22528]
-
blk.29.ffn_up.weightQ8_0[8192 22528]
-
blk.29.attn_k.weightQ8_0[8192 8192]
-
blk.29.attn_output.weightQ8_0[8192 8192]
-
blk.29.attn_q.weightQ8_0[8192 8192]
-
blk.29.attn_v.weightQ8_0[8192 8192]
-
blk.30.attn_k.weightQ8_0[8192 8192]
-
blk.30.attn_output.weightQ8_0[8192 8192]
-
blk.30.attn_q.weightQ8_0[8192 8192]
-
blk.30.attn_v.weightQ8_0[8192 8192]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ8_0[22528 8192]
-
blk.30.ffn_gate.weightQ8_0[8192 22528]
-
blk.30.ffn_up.weightQ8_0[8192 22528]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ8_0[22528 8192]
-
blk.31.ffn_gate.weightQ8_0[8192 22528]
-
blk.31.ffn_up.weightQ8_0[8192 22528]
-
blk.31.attn_k.weightQ8_0[8192 8192]
-
blk.31.attn_output.weightQ8_0[8192 8192]
-
blk.31.attn_q.weightQ8_0[8192 8192]
-
blk.31.attn_v.weightQ8_0[8192 8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ8_0[22528 8192]
-
blk.32.ffn_gate.weightQ8_0[8192 22528]
-
blk.32.ffn_up.weightQ8_0[8192 22528]
-
blk.32.attn_k.weightQ8_0[8192 8192]
-
blk.32.attn_output.weightQ8_0[8192 8192]
-
blk.32.attn_q.weightQ8_0[8192 8192]
-
blk.32.attn_v.weightQ8_0[8192 8192]
-
blk.33.attn_k.weightQ8_0[8192 8192]
-
blk.33.attn_output.weightQ8_0[8192 8192]
-
blk.33.attn_q.weightQ8_0[8192 8192]
-
blk.33.attn_v.weightQ8_0[8192 8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ8_0[22528 8192]
-
blk.33.ffn_gate.weightQ8_0[8192 22528]
-
blk.33.ffn_up.weightQ8_0[8192 22528]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ8_0[22528 8192]
-
blk.34.ffn_gate.weightQ8_0[8192 22528]
-
blk.34.ffn_up.weightQ8_0[8192 22528]
-
blk.34.attn_k.weightQ8_0[8192 8192]
-
blk.34.attn_output.weightQ8_0[8192 8192]
-
blk.34.attn_q.weightQ8_0[8192 8192]
-
blk.34.attn_v.weightQ8_0[8192 8192]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ8_0[22528 8192]
-
blk.35.ffn_gate.weightQ8_0[8192 22528]
-
blk.35.ffn_up.weightQ8_0[8192 22528]
-
blk.35.attn_k.weightQ8_0[8192 8192]
-
blk.35.attn_output.weightQ8_0[8192 8192]
-
blk.35.attn_q.weightQ8_0[8192 8192]
-
blk.35.attn_v.weightQ8_0[8192 8192]
-
blk.36.attn_k.weightQ8_0[8192 8192]
-
blk.36.attn_output.weightQ8_0[8192 8192]
-
blk.36.attn_q.weightQ8_0[8192 8192]
-
blk.36.attn_v.weightQ8_0[8192 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ8_0[22528 8192]
-
blk.36.ffn_gate.weightQ8_0[8192 22528]
-
blk.36.ffn_up.weightQ8_0[8192 22528]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ8_0[22528 8192]
-
blk.37.ffn_gate.weightQ8_0[8192 22528]
-
blk.37.ffn_up.weightQ8_0[8192 22528]
-
blk.37.attn_k.weightQ8_0[8192 8192]
-
blk.37.attn_output.weightQ8_0[8192 8192]
-
blk.37.attn_q.weightQ8_0[8192 8192]
-
blk.37.attn_v.weightQ8_0[8192 8192]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ8_0[22528 8192]
-
blk.38.ffn_gate.weightQ8_0[8192 22528]
-
blk.38.ffn_up.weightQ8_0[8192 22528]
-
blk.38.attn_k.weightQ8_0[8192 8192]
-
blk.38.attn_output.weightQ8_0[8192 8192]
-
blk.38.attn_q.weightQ8_0[8192 8192]
-
blk.38.attn_v.weightQ8_0[8192 8192]
-
blk.39.attn_k.weightQ8_0[8192 8192]
-
blk.39.attn_output.weightQ8_0[8192 8192]
-
blk.39.attn_q.weightQ8_0[8192 8192]
-
blk.39.attn_v.weightQ8_0[8192 8192]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ8_0[22528 8192]
-
blk.39.ffn_gate.weightQ8_0[8192 22528]
-
blk.39.ffn_up.weightQ8_0[8192 22528]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39