latest
7.2GB
https://huggingface.co/WhiteRabbitNeo/WhiteRabbitNeo-7B-v1.5a
7B
304 Pulls Updated 7 months ago
4b28e031b54e · 7.2GB
-
general.architecturellama
-
general.file_typeQ8_0
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count32
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id32022
-
tokenizer.ggml.eos_token_id32023
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
tokenizer.ggml.unknown_token_id32024
-
NameTypeShape
-
token_embd.weightQ8_0[4096 32256]
-
blk.0.attn_q.weightQ8_0[4096 4096]
-
blk.0.attn_k.weightQ8_0[4096 4096]
-
blk.0.attn_v.weightQ8_0[4096 4096]
-
blk.0.attn_output.weightQ8_0[4096 4096]
-
blk.0.ffn_gate.weightQ8_0[4096 11008]
-
blk.0.ffn_up.weightQ8_0[4096 11008]
-
blk.0.ffn_down.weightQ8_0[11008 4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.1.attn_q.weightQ8_0[4096 4096]
-
blk.1.attn_k.weightQ8_0[4096 4096]
-
blk.1.attn_v.weightQ8_0[4096 4096]
-
blk.1.attn_output.weightQ8_0[4096 4096]
-
blk.1.ffn_gate.weightQ8_0[4096 11008]
-
blk.1.ffn_up.weightQ8_0[4096 11008]
-
blk.1.ffn_down.weightQ8_0[11008 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.2.attn_q.weightQ8_0[4096 4096]
-
blk.2.attn_k.weightQ8_0[4096 4096]
-
blk.2.attn_v.weightQ8_0[4096 4096]
-
blk.2.attn_output.weightQ8_0[4096 4096]
-
blk.2.ffn_gate.weightQ8_0[4096 11008]
-
blk.2.ffn_up.weightQ8_0[4096 11008]
-
blk.2.ffn_down.weightQ8_0[11008 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.3.attn_q.weightQ8_0[4096 4096]
-
blk.3.attn_k.weightQ8_0[4096 4096]
-
blk.3.attn_v.weightQ8_0[4096 4096]
-
blk.3.attn_output.weightQ8_0[4096 4096]
-
blk.3.ffn_gate.weightQ8_0[4096 11008]
-
blk.3.ffn_up.weightQ8_0[4096 11008]
-
blk.3.ffn_down.weightQ8_0[11008 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.4.attn_q.weightQ8_0[4096 4096]
-
blk.4.attn_k.weightQ8_0[4096 4096]
-
blk.4.attn_v.weightQ8_0[4096 4096]
-
blk.4.attn_output.weightQ8_0[4096 4096]
-
blk.4.ffn_gate.weightQ8_0[4096 11008]
-
blk.4.ffn_up.weightQ8_0[4096 11008]
-
blk.4.ffn_down.weightQ8_0[11008 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.5.attn_q.weightQ8_0[4096 4096]
-
blk.5.attn_k.weightQ8_0[4096 4096]
-
blk.5.attn_v.weightQ8_0[4096 4096]
-
blk.5.attn_output.weightQ8_0[4096 4096]
-
blk.5.ffn_gate.weightQ8_0[4096 11008]
-
blk.5.ffn_up.weightQ8_0[4096 11008]
-
blk.5.ffn_down.weightQ8_0[11008 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.6.attn_q.weightQ8_0[4096 4096]
-
blk.6.attn_k.weightQ8_0[4096 4096]
-
blk.6.attn_v.weightQ8_0[4096 4096]
-
blk.6.attn_output.weightQ8_0[4096 4096]
-
blk.6.ffn_gate.weightQ8_0[4096 11008]
-
blk.6.ffn_up.weightQ8_0[4096 11008]
-
blk.6.ffn_down.weightQ8_0[11008 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.7.attn_q.weightQ8_0[4096 4096]
-
blk.7.attn_k.weightQ8_0[4096 4096]
-
blk.7.attn_v.weightQ8_0[4096 4096]
-
blk.7.attn_output.weightQ8_0[4096 4096]
-
blk.7.ffn_gate.weightQ8_0[4096 11008]
-
blk.7.ffn_up.weightQ8_0[4096 11008]
-
blk.7.ffn_down.weightQ8_0[11008 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.8.attn_q.weightQ8_0[4096 4096]
-
blk.8.attn_k.weightQ8_0[4096 4096]
-
blk.8.attn_v.weightQ8_0[4096 4096]
-
blk.8.attn_output.weightQ8_0[4096 4096]
-
blk.8.ffn_gate.weightQ8_0[4096 11008]
-
blk.8.ffn_up.weightQ8_0[4096 11008]
-
blk.8.ffn_down.weightQ8_0[11008 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.9.attn_q.weightQ8_0[4096 4096]
-
blk.9.attn_k.weightQ8_0[4096 4096]
-
blk.9.attn_v.weightQ8_0[4096 4096]
-
blk.9.attn_output.weightQ8_0[4096 4096]
-
blk.9.ffn_gate.weightQ8_0[4096 11008]
-
blk.9.ffn_up.weightQ8_0[4096 11008]
-
blk.9.ffn_down.weightQ8_0[11008 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.10.attn_q.weightQ8_0[4096 4096]
-
blk.10.attn_k.weightQ8_0[4096 4096]
-
blk.10.attn_v.weightQ8_0[4096 4096]
-
blk.10.attn_output.weightQ8_0[4096 4096]
-
blk.10.ffn_gate.weightQ8_0[4096 11008]
-
blk.10.ffn_up.weightQ8_0[4096 11008]
-
blk.10.ffn_down.weightQ8_0[11008 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.11.attn_q.weightQ8_0[4096 4096]
-
blk.11.attn_k.weightQ8_0[4096 4096]
-
blk.11.attn_v.weightQ8_0[4096 4096]
-
blk.11.attn_output.weightQ8_0[4096 4096]
-
blk.11.ffn_gate.weightQ8_0[4096 11008]
-
blk.11.ffn_up.weightQ8_0[4096 11008]
-
blk.11.ffn_down.weightQ8_0[11008 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_q.weightQ8_0[4096 4096]
-
blk.12.attn_k.weightQ8_0[4096 4096]
-
blk.12.attn_v.weightQ8_0[4096 4096]
-
blk.12.attn_output.weightQ8_0[4096 4096]
-
blk.12.ffn_gate.weightQ8_0[4096 11008]
-
blk.12.ffn_up.weightQ8_0[4096 11008]
-
blk.12.ffn_down.weightQ8_0[11008 4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_q.weightQ8_0[4096 4096]
-
blk.13.attn_k.weightQ8_0[4096 4096]
-
blk.13.attn_v.weightQ8_0[4096 4096]
-
blk.13.attn_output.weightQ8_0[4096 4096]
-
blk.13.ffn_gate.weightQ8_0[4096 11008]
-
blk.13.ffn_up.weightQ8_0[4096 11008]
-
blk.13.ffn_down.weightQ8_0[11008 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.14.attn_q.weightQ8_0[4096 4096]
-
blk.14.attn_k.weightQ8_0[4096 4096]
-
blk.14.attn_v.weightQ8_0[4096 4096]
-
blk.14.attn_output.weightQ8_0[4096 4096]
-
blk.14.ffn_gate.weightQ8_0[4096 11008]
-
blk.14.ffn_up.weightQ8_0[4096 11008]
-
blk.14.ffn_down.weightQ8_0[11008 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.15.attn_q.weightQ8_0[4096 4096]
-
blk.15.attn_k.weightQ8_0[4096 4096]
-
blk.15.attn_v.weightQ8_0[4096 4096]
-
blk.15.attn_output.weightQ8_0[4096 4096]
-
blk.15.ffn_gate.weightQ8_0[4096 11008]
-
blk.15.ffn_up.weightQ8_0[4096 11008]
-
blk.15.ffn_down.weightQ8_0[11008 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.16.attn_q.weightQ8_0[4096 4096]
-
blk.16.attn_k.weightQ8_0[4096 4096]
-
blk.16.attn_v.weightQ8_0[4096 4096]
-
blk.16.attn_output.weightQ8_0[4096 4096]
-
blk.16.ffn_gate.weightQ8_0[4096 11008]
-
blk.16.ffn_up.weightQ8_0[4096 11008]
-
blk.16.ffn_down.weightQ8_0[11008 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.17.attn_q.weightQ8_0[4096 4096]
-
blk.17.attn_k.weightQ8_0[4096 4096]
-
blk.17.attn_v.weightQ8_0[4096 4096]
-
blk.17.attn_output.weightQ8_0[4096 4096]
-
blk.17.ffn_gate.weightQ8_0[4096 11008]
-
blk.17.ffn_up.weightQ8_0[4096 11008]
-
blk.17.ffn_down.weightQ8_0[11008 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.18.attn_q.weightQ8_0[4096 4096]
-
blk.18.attn_k.weightQ8_0[4096 4096]
-
blk.18.attn_v.weightQ8_0[4096 4096]
-
blk.18.attn_output.weightQ8_0[4096 4096]
-
blk.18.ffn_gate.weightQ8_0[4096 11008]
-
blk.18.ffn_up.weightQ8_0[4096 11008]
-
blk.18.ffn_down.weightQ8_0[11008 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.19.attn_q.weightQ8_0[4096 4096]
-
blk.19.attn_k.weightQ8_0[4096 4096]
-
blk.19.attn_v.weightQ8_0[4096 4096]
-
blk.19.attn_output.weightQ8_0[4096 4096]
-
blk.19.ffn_gate.weightQ8_0[4096 11008]
-
blk.19.ffn_up.weightQ8_0[4096 11008]
-
blk.19.ffn_down.weightQ8_0[11008 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.20.attn_q.weightQ8_0[4096 4096]
-
blk.20.attn_k.weightQ8_0[4096 4096]
-
blk.20.attn_v.weightQ8_0[4096 4096]
-
blk.20.attn_output.weightQ8_0[4096 4096]
-
blk.20.ffn_gate.weightQ8_0[4096 11008]
-
blk.20.ffn_up.weightQ8_0[4096 11008]
-
blk.20.ffn_down.weightQ8_0[11008 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.21.attn_q.weightQ8_0[4096 4096]
-
blk.21.attn_k.weightQ8_0[4096 4096]
-
blk.21.attn_v.weightQ8_0[4096 4096]
-
blk.21.attn_output.weightQ8_0[4096 4096]
-
blk.21.ffn_gate.weightQ8_0[4096 11008]
-
blk.21.ffn_up.weightQ8_0[4096 11008]
-
blk.21.ffn_down.weightQ8_0[11008 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.22.attn_q.weightQ8_0[4096 4096]
-
blk.22.attn_k.weightQ8_0[4096 4096]
-
blk.22.attn_v.weightQ8_0[4096 4096]
-
blk.22.attn_output.weightQ8_0[4096 4096]
-
blk.22.ffn_gate.weightQ8_0[4096 11008]
-
blk.22.ffn_up.weightQ8_0[4096 11008]
-
blk.22.ffn_down.weightQ8_0[11008 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.23.attn_q.weightQ8_0[4096 4096]
-
blk.23.attn_k.weightQ8_0[4096 4096]
-
blk.23.attn_v.weightQ8_0[4096 4096]
-
blk.23.attn_output.weightQ8_0[4096 4096]
-
blk.23.ffn_gate.weightQ8_0[4096 11008]
-
blk.23.ffn_up.weightQ8_0[4096 11008]
-
blk.23.ffn_down.weightQ8_0[11008 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_q.weightQ8_0[4096 4096]
-
blk.24.attn_k.weightQ8_0[4096 4096]
-
blk.24.attn_v.weightQ8_0[4096 4096]
-
blk.24.attn_output.weightQ8_0[4096 4096]
-
blk.24.ffn_gate.weightQ8_0[4096 11008]
-
blk.24.ffn_up.weightQ8_0[4096 11008]
-
blk.24.ffn_down.weightQ8_0[11008 4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.25.attn_q.weightQ8_0[4096 4096]
-
blk.25.attn_k.weightQ8_0[4096 4096]
-
blk.25.attn_v.weightQ8_0[4096 4096]
-
blk.25.attn_output.weightQ8_0[4096 4096]
-
blk.25.ffn_gate.weightQ8_0[4096 11008]
-
blk.25.ffn_up.weightQ8_0[4096 11008]
-
blk.25.ffn_down.weightQ8_0[11008 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.26.attn_q.weightQ8_0[4096 4096]
-
blk.26.attn_k.weightQ8_0[4096 4096]
-
blk.26.attn_v.weightQ8_0[4096 4096]
-
blk.26.attn_output.weightQ8_0[4096 4096]
-
blk.26.ffn_gate.weightQ8_0[4096 11008]
-
blk.26.ffn_up.weightQ8_0[4096 11008]
-
blk.26.ffn_down.weightQ8_0[11008 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.27.attn_q.weightQ8_0[4096 4096]
-
blk.27.attn_k.weightQ8_0[4096 4096]
-
blk.27.attn_v.weightQ8_0[4096 4096]
-
blk.27.attn_output.weightQ8_0[4096 4096]
-
blk.27.ffn_gate.weightQ8_0[4096 11008]
-
blk.27.ffn_up.weightQ8_0[4096 11008]
-
blk.27.ffn_down.weightQ8_0[11008 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.28.attn_q.weightQ8_0[4096 4096]
-
blk.28.attn_k.weightQ8_0[4096 4096]
-
blk.28.attn_v.weightQ8_0[4096 4096]
-
blk.28.attn_output.weightQ8_0[4096 4096]
-
blk.28.ffn_gate.weightQ8_0[4096 11008]
-
blk.28.ffn_up.weightQ8_0[4096 11008]
-
blk.28.ffn_down.weightQ8_0[11008 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.29.attn_q.weightQ8_0[4096 4096]
-
blk.29.attn_k.weightQ8_0[4096 4096]
-
blk.29.attn_v.weightQ8_0[4096 4096]
-
blk.29.attn_output.weightQ8_0[4096 4096]
-
blk.29.ffn_gate.weightQ8_0[4096 11008]
-
blk.29.ffn_up.weightQ8_0[4096 11008]
-
blk.29.ffn_down.weightQ8_0[11008 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.30.attn_q.weightQ8_0[4096 4096]
-
blk.30.attn_k.weightQ8_0[4096 4096]
-
blk.30.attn_v.weightQ8_0[4096 4096]
-
blk.30.attn_output.weightQ8_0[4096 4096]
-
blk.30.ffn_gate.weightQ8_0[4096 11008]
-
blk.30.ffn_up.weightQ8_0[4096 11008]
-
blk.30.ffn_down.weightQ8_0[11008 4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.31.attn_q.weightQ8_0[4096 4096]
-
blk.31.attn_k.weightQ8_0[4096 4096]
-
blk.31.attn_v.weightQ8_0[4096 4096]
-
blk.31.attn_output.weightQ8_0[4096 4096]
-
blk.31.ffn_gate.weightQ8_0[4096 11008]
-
blk.31.ffn_up.weightQ8_0[4096 11008]
-
blk.31.ffn_down.weightQ8_0[11008 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_norm.weightF32[4096]
-
output_norm.weightF32[4096]
-
output.weightQ8_0[4096 32256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31