latest
2.0GB
Replit Code v1.5 is a 3.3B parameter Causal Language Model focused on Code Completion.
311 Pulls Updated 5 months ago
e5f23238e18e · 2.0GB
-
general.architecturempt
-
general.file_typeQ4_0
-
mpt.attention.head_count24
-
mpt.attention.head_count_kv8
-
mpt.attention.layer_norm_epsilon1e-05
-
mpt.attention.max_alibi_bias8
-
mpt.block_count32
-
mpt.context_length4096
-
mpt.embedding_length3072
-
mpt.feed_forward_length12288
-
tokenizer.ggml.bos_token_id0
-
tokenizer.ggml.eos_token_id0
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ ĠĠĠĠ ĠĠĠĠ ĠĠ Ġ e r ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<|endoftext|> <|padding|> <fim_prefix> <fim_middle> <fim_suffix> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_0[3072 32768]
-
blk.0.attn_norm.weightF32[3072]
-
blk.0.attn_qkv.weightQ4_0[3072 5120]
-
blk.0.attn_output.weightQ4_0[3072 3072]
-
blk.0.ffn_norm.weightF32[3072]
-
blk.0.ffn_up.weightQ4_0[3072 12288]
-
blk.0.ffn_down.weightQ4_0[12288 3072]
-
blk.1.attn_norm.weightF32[3072]
-
blk.1.attn_qkv.weightQ4_0[3072 5120]
-
blk.1.attn_output.weightQ4_0[3072 3072]
-
blk.1.ffn_norm.weightF32[3072]
-
blk.1.ffn_up.weightQ4_0[3072 12288]
-
blk.1.ffn_down.weightQ4_0[12288 3072]
-
blk.2.attn_norm.weightF32[3072]
-
blk.2.attn_qkv.weightQ4_0[3072 5120]
-
blk.2.attn_output.weightQ4_0[3072 3072]
-
blk.2.ffn_norm.weightF32[3072]
-
blk.2.ffn_up.weightQ4_0[3072 12288]
-
blk.2.ffn_down.weightQ4_0[12288 3072]
-
blk.3.attn_norm.weightF32[3072]
-
blk.3.attn_qkv.weightQ4_0[3072 5120]
-
blk.3.attn_output.weightQ4_0[3072 3072]
-
blk.3.ffn_norm.weightF32[3072]
-
blk.3.ffn_up.weightQ4_0[3072 12288]
-
blk.3.ffn_down.weightQ4_0[12288 3072]
-
blk.4.attn_norm.weightF32[3072]
-
blk.4.attn_qkv.weightQ4_0[3072 5120]
-
blk.4.attn_output.weightQ4_0[3072 3072]
-
blk.4.ffn_norm.weightF32[3072]
-
blk.4.ffn_up.weightQ4_0[3072 12288]
-
blk.4.ffn_down.weightQ4_0[12288 3072]
-
blk.5.attn_norm.weightF32[3072]
-
blk.5.attn_qkv.weightQ4_0[3072 5120]
-
blk.5.attn_output.weightQ4_0[3072 3072]
-
blk.5.ffn_norm.weightF32[3072]
-
blk.5.ffn_up.weightQ4_0[3072 12288]
-
blk.5.ffn_down.weightQ4_0[12288 3072]
-
blk.6.attn_norm.weightF32[3072]
-
blk.6.attn_qkv.weightQ4_0[3072 5120]
-
blk.6.attn_output.weightQ4_0[3072 3072]
-
blk.6.ffn_norm.weightF32[3072]
-
blk.6.ffn_up.weightQ4_0[3072 12288]
-
blk.6.ffn_down.weightQ4_0[12288 3072]
-
blk.7.attn_norm.weightF32[3072]
-
blk.7.attn_qkv.weightQ4_0[3072 5120]
-
blk.7.attn_output.weightQ4_0[3072 3072]
-
blk.7.ffn_norm.weightF32[3072]
-
blk.7.ffn_up.weightQ4_0[3072 12288]
-
blk.7.ffn_down.weightQ4_0[12288 3072]
-
blk.8.attn_norm.weightF32[3072]
-
blk.8.attn_qkv.weightQ4_0[3072 5120]
-
blk.8.attn_output.weightQ4_0[3072 3072]
-
blk.8.ffn_norm.weightF32[3072]
-
blk.8.ffn_up.weightQ4_0[3072 12288]
-
blk.8.ffn_down.weightQ4_0[12288 3072]
-
blk.9.attn_norm.weightF32[3072]
-
blk.9.attn_qkv.weightQ4_0[3072 5120]
-
blk.9.attn_output.weightQ4_0[3072 3072]
-
blk.9.ffn_norm.weightF32[3072]
-
blk.9.ffn_up.weightQ4_0[3072 12288]
-
blk.9.ffn_down.weightQ4_0[12288 3072]
-
blk.10.attn_norm.weightF32[3072]
-
blk.10.attn_qkv.weightQ4_0[3072 5120]
-
blk.10.attn_output.weightQ4_0[3072 3072]
-
blk.10.ffn_norm.weightF32[3072]
-
blk.10.ffn_up.weightQ4_0[3072 12288]
-
blk.10.ffn_down.weightQ4_0[12288 3072]
-
blk.11.attn_norm.weightF32[3072]
-
blk.11.attn_qkv.weightQ4_0[3072 5120]
-
blk.11.attn_output.weightQ4_0[3072 3072]
-
blk.11.ffn_norm.weightF32[3072]
-
blk.11.ffn_up.weightQ4_0[3072 12288]
-
blk.11.ffn_down.weightQ4_0[12288 3072]
-
blk.12.attn_norm.weightF32[3072]
-
blk.12.attn_qkv.weightQ4_0[3072 5120]
-
blk.12.attn_output.weightQ4_0[3072 3072]
-
blk.12.ffn_norm.weightF32[3072]
-
blk.12.ffn_up.weightQ4_0[3072 12288]
-
blk.12.ffn_down.weightQ4_0[12288 3072]
-
blk.13.attn_norm.weightF32[3072]
-
blk.13.attn_qkv.weightQ4_0[3072 5120]
-
blk.13.attn_output.weightQ4_0[3072 3072]
-
blk.13.ffn_norm.weightF32[3072]
-
blk.13.ffn_up.weightQ4_0[3072 12288]
-
blk.13.ffn_down.weightQ4_0[12288 3072]
-
blk.14.attn_norm.weightF32[3072]
-
blk.14.attn_qkv.weightQ4_0[3072 5120]
-
blk.14.attn_output.weightQ4_0[3072 3072]
-
blk.14.ffn_norm.weightF32[3072]
-
blk.14.ffn_up.weightQ4_0[3072 12288]
-
blk.14.ffn_down.weightQ4_0[12288 3072]
-
blk.15.attn_norm.weightF32[3072]
-
blk.15.attn_qkv.weightQ4_0[3072 5120]
-
blk.15.attn_output.weightQ4_0[3072 3072]
-
blk.15.ffn_norm.weightF32[3072]
-
blk.15.ffn_up.weightQ4_0[3072 12288]
-
blk.15.ffn_down.weightQ4_0[12288 3072]
-
blk.16.attn_norm.weightF32[3072]
-
blk.16.attn_qkv.weightQ4_0[3072 5120]
-
blk.16.attn_output.weightQ4_0[3072 3072]
-
blk.16.ffn_norm.weightF32[3072]
-
blk.16.ffn_up.weightQ4_0[3072 12288]
-
blk.16.ffn_down.weightQ4_0[12288 3072]
-
blk.17.attn_norm.weightF32[3072]
-
blk.17.attn_qkv.weightQ4_0[3072 5120]
-
blk.17.attn_output.weightQ4_0[3072 3072]
-
blk.17.ffn_norm.weightF32[3072]
-
blk.17.ffn_up.weightQ4_0[3072 12288]
-
blk.17.ffn_down.weightQ4_0[12288 3072]
-
blk.18.attn_norm.weightF32[3072]
-
blk.18.attn_qkv.weightQ4_0[3072 5120]
-
blk.18.attn_output.weightQ4_0[3072 3072]
-
blk.18.ffn_norm.weightF32[3072]
-
blk.18.ffn_up.weightQ4_0[3072 12288]
-
blk.18.ffn_down.weightQ4_0[12288 3072]
-
blk.19.attn_norm.weightF32[3072]
-
blk.19.attn_qkv.weightQ4_0[3072 5120]
-
blk.19.attn_output.weightQ4_0[3072 3072]
-
blk.19.ffn_norm.weightF32[3072]
-
blk.19.ffn_up.weightQ4_0[3072 12288]
-
blk.19.ffn_down.weightQ4_0[12288 3072]
-
blk.20.attn_norm.weightF32[3072]
-
blk.20.attn_qkv.weightQ4_0[3072 5120]
-
blk.20.attn_output.weightQ4_0[3072 3072]
-
blk.20.ffn_norm.weightF32[3072]
-
blk.20.ffn_up.weightQ4_0[3072 12288]
-
blk.20.ffn_down.weightQ4_0[12288 3072]
-
blk.21.attn_norm.weightF32[3072]
-
blk.21.attn_qkv.weightQ4_0[3072 5120]
-
blk.21.attn_output.weightQ4_0[3072 3072]
-
blk.21.ffn_norm.weightF32[3072]
-
blk.21.ffn_up.weightQ4_0[3072 12288]
-
blk.21.ffn_down.weightQ4_0[12288 3072]
-
blk.22.attn_norm.weightF32[3072]
-
blk.22.attn_qkv.weightQ4_0[3072 5120]
-
blk.22.attn_output.weightQ4_0[3072 3072]
-
blk.22.ffn_norm.weightF32[3072]
-
blk.22.ffn_up.weightQ4_0[3072 12288]
-
blk.22.ffn_down.weightQ4_0[12288 3072]
-
blk.23.attn_norm.weightF32[3072]
-
blk.23.attn_qkv.weightQ4_0[3072 5120]
-
blk.23.attn_output.weightQ4_0[3072 3072]
-
blk.23.ffn_norm.weightF32[3072]
-
blk.23.ffn_up.weightQ4_0[3072 12288]
-
blk.23.ffn_down.weightQ4_0[12288 3072]
-
blk.24.attn_norm.weightF32[3072]
-
blk.24.attn_qkv.weightQ4_0[3072 5120]
-
blk.24.attn_output.weightQ4_0[3072 3072]
-
blk.24.ffn_norm.weightF32[3072]
-
blk.24.ffn_up.weightQ4_0[3072 12288]
-
blk.24.ffn_down.weightQ4_0[12288 3072]
-
blk.25.attn_norm.weightF32[3072]
-
blk.25.attn_qkv.weightQ4_0[3072 5120]
-
blk.25.attn_output.weightQ4_0[3072 3072]
-
blk.25.ffn_norm.weightF32[3072]
-
blk.25.ffn_up.weightQ4_0[3072 12288]
-
blk.25.ffn_down.weightQ4_0[12288 3072]
-
blk.26.attn_norm.weightF32[3072]
-
blk.26.attn_qkv.weightQ4_0[3072 5120]
-
blk.26.attn_output.weightQ4_0[3072 3072]
-
blk.26.ffn_norm.weightF32[3072]
-
blk.26.ffn_up.weightQ4_0[3072 12288]
-
blk.26.ffn_down.weightQ4_0[12288 3072]
-
blk.27.attn_norm.weightF32[3072]
-
blk.27.attn_qkv.weightQ4_0[3072 5120]
-
blk.27.attn_output.weightQ4_0[3072 3072]
-
blk.27.ffn_norm.weightF32[3072]
-
blk.27.ffn_up.weightQ4_0[3072 12288]
-
blk.27.ffn_down.weightQ4_0[12288 3072]
-
blk.28.attn_norm.weightF32[3072]
-
blk.28.attn_qkv.weightQ4_0[3072 5120]
-
blk.28.attn_output.weightQ4_0[3072 3072]
-
blk.28.ffn_norm.weightF32[3072]
-
blk.28.ffn_up.weightQ4_0[3072 12288]
-
blk.28.ffn_down.weightQ4_0[12288 3072]
-
blk.29.attn_norm.weightF32[3072]
-
blk.29.attn_qkv.weightQ4_0[3072 5120]
-
blk.29.attn_output.weightQ4_0[3072 3072]
-
blk.29.ffn_norm.weightF32[3072]
-
blk.29.ffn_up.weightQ4_0[3072 12288]
-
blk.29.ffn_down.weightQ4_0[12288 3072]
-
blk.30.attn_norm.weightF32[3072]
-
blk.30.attn_qkv.weightQ4_0[3072 5120]
-
blk.30.attn_output.weightQ4_0[3072 3072]
-
blk.30.ffn_norm.weightF32[3072]
-
blk.30.ffn_up.weightQ4_0[3072 12288]
-
blk.30.ffn_down.weightQ4_0[12288 3072]
-
blk.31.attn_norm.weightF32[3072]
-
blk.31.attn_qkv.weightQ4_0[3072 5120]
-
blk.31.attn_output.weightQ4_0[3072 3072]
-
blk.31.ffn_norm.weightF32[3072]
-
blk.31.ffn_up.weightQ4_0[3072 12288]
-
blk.31.ffn_down.weightQ4_0[12288 3072]
-
output.weightQ6_K[3072 32768]
-
output_norm.weightF32[3072]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31