latest
6.4GB
twodoerss
11B
Updated 6 weeks ago
ad5d403531dd · 6.4GB
-
general.architecturefalcon
-
general.file_typeQ4_0
-
falcon.attention.head_count32
-
falcon.attention.head_count_kv8
-
falcon.attention.layer_norm_epsilon1e-05
-
falcon.block_count60
-
falcon.context_length2048
-
falcon.embedding_length4096
-
falcon.feed_forward_length16384
-
falcon.tensor_data_layoutjploski
-
tokenizer.ggml.bos_token_id500
-
tokenizer.ggml.eos_token_id11
-
tokenizer.ggml.merges[Ġ t Ġ a i n h e r e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id11
-
tokenizer.ggml.prefalcon
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[>>TITLE<< >>ABSTRACT<< >>INTRODUCTION<< >>SUMMARY<< >>COMMENT<< ...]
-
NameTypeShape
-
token_embd.weightQ4_0[4096 65024]
-
blk.0.attn_norm.biasF32[4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ4_0[16384 4096]
-
blk.0.ffn_up.weightQ4_0[4096 16384]
-
blk.0.attn_output.weightQ4_0[4096 4096]
-
blk.0.attn_qkv.weightQ4_0[4096 6144]
-
blk.1.attn_norm.biasF32[4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ4_0[16384 4096]
-
blk.1.ffn_up.weightQ4_0[4096 16384]
-
blk.1.attn_output.weightQ4_0[4096 4096]
-
blk.1.attn_qkv.weightQ4_0[4096 6144]
-
blk.2.attn_norm.biasF32[4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ4_0[16384 4096]
-
blk.2.ffn_up.weightQ4_0[4096 16384]
-
blk.2.attn_output.weightQ4_0[4096 4096]
-
blk.2.attn_qkv.weightQ4_0[4096 6144]
-
blk.3.attn_norm.biasF32[4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ4_0[16384 4096]
-
blk.3.ffn_up.weightQ4_0[4096 16384]
-
blk.3.attn_output.weightQ4_0[4096 4096]
-
blk.3.attn_qkv.weightQ4_0[4096 6144]
-
blk.4.attn_norm.biasF32[4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ4_0[16384 4096]
-
blk.4.ffn_up.weightQ4_0[4096 16384]
-
blk.4.attn_output.weightQ4_0[4096 4096]
-
blk.4.attn_qkv.weightQ4_0[4096 6144]
-
blk.5.attn_norm.biasF32[4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ4_0[16384 4096]
-
blk.5.ffn_up.weightQ4_0[4096 16384]
-
blk.5.attn_output.weightQ4_0[4096 4096]
-
blk.5.attn_qkv.weightQ4_0[4096 6144]
-
blk.6.attn_norm.biasF32[4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ4_0[16384 4096]
-
blk.6.ffn_up.weightQ4_0[4096 16384]
-
blk.6.attn_output.weightQ4_0[4096 4096]
-
blk.6.attn_qkv.weightQ4_0[4096 6144]
-
blk.7.attn_norm.biasF32[4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ4_0[16384 4096]
-
blk.7.ffn_up.weightQ4_0[4096 16384]
-
blk.7.attn_output.weightQ4_0[4096 4096]
-
blk.7.attn_qkv.weightQ4_0[4096 6144]
-
blk.8.attn_norm.biasF32[4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ4_0[16384 4096]
-
blk.8.ffn_up.weightQ4_0[4096 16384]
-
blk.8.attn_output.weightQ4_0[4096 4096]
-
blk.8.attn_qkv.weightQ4_0[4096 6144]
-
blk.9.attn_norm.biasF32[4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ4_0[16384 4096]
-
blk.9.ffn_up.weightQ4_0[4096 16384]
-
blk.9.attn_output.weightQ4_0[4096 4096]
-
blk.9.attn_qkv.weightQ4_0[4096 6144]
-
blk.10.attn_norm.biasF32[4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ4_0[16384 4096]
-
blk.10.ffn_up.weightQ4_0[4096 16384]
-
blk.10.attn_output.weightQ4_0[4096 4096]
-
blk.10.attn_qkv.weightQ4_0[4096 6144]
-
blk.11.attn_norm.biasF32[4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ4_0[16384 4096]
-
blk.11.ffn_up.weightQ4_0[4096 16384]
-
blk.11.attn_output.weightQ4_0[4096 4096]
-
blk.11.attn_qkv.weightQ4_0[4096 6144]
-
blk.12.ffn_up.weightQ4_0[4096 16384]
-
blk.12.attn_output.weightQ4_0[4096 4096]
-
blk.12.attn_qkv.weightQ4_0[4096 6144]
-
blk.12.attn_norm.biasF32[4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ4_0[16384 4096]
-
blk.13.attn_norm.biasF32[4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ4_0[16384 4096]
-
blk.13.ffn_up.weightQ4_0[4096 16384]
-
blk.13.attn_output.weightQ4_0[4096 4096]
-
blk.13.attn_qkv.weightQ4_0[4096 6144]
-
blk.14.attn_norm.biasF32[4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ4_0[16384 4096]
-
blk.14.ffn_up.weightQ4_0[4096 16384]
-
blk.14.attn_output.weightQ4_0[4096 4096]
-
blk.14.attn_qkv.weightQ4_0[4096 6144]
-
blk.15.attn_norm.biasF32[4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ4_0[16384 4096]
-
blk.15.ffn_up.weightQ4_0[4096 16384]
-
blk.15.attn_output.weightQ4_0[4096 4096]
-
blk.15.attn_qkv.weightQ4_0[4096 6144]
-
blk.16.attn_norm.biasF32[4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ4_0[16384 4096]
-
blk.16.ffn_up.weightQ4_0[4096 16384]
-
blk.16.attn_output.weightQ4_0[4096 4096]
-
blk.16.attn_qkv.weightQ4_0[4096 6144]
-
blk.17.attn_norm.biasF32[4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ4_0[16384 4096]
-
blk.17.ffn_up.weightQ4_0[4096 16384]
-
blk.17.attn_output.weightQ4_0[4096 4096]
-
blk.17.attn_qkv.weightQ4_0[4096 6144]
-
blk.18.attn_norm.biasF32[4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ4_0[16384 4096]
-
blk.18.ffn_up.weightQ4_0[4096 16384]
-
blk.18.attn_output.weightQ4_0[4096 4096]
-
blk.18.attn_qkv.weightQ4_0[4096 6144]
-
blk.19.attn_norm.biasF32[4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ4_0[16384 4096]
-
blk.19.ffn_up.weightQ4_0[4096 16384]
-
blk.19.attn_output.weightQ4_0[4096 4096]
-
blk.19.attn_qkv.weightQ4_0[4096 6144]
-
blk.20.attn_norm.biasF32[4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ4_0[16384 4096]
-
blk.20.ffn_up.weightQ4_0[4096 16384]
-
blk.20.attn_output.weightQ4_0[4096 4096]
-
blk.20.attn_qkv.weightQ4_0[4096 6144]
-
blk.21.attn_norm.biasF32[4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ4_0[16384 4096]
-
blk.21.ffn_up.weightQ4_0[4096 16384]
-
blk.21.attn_output.weightQ4_0[4096 4096]
-
blk.21.attn_qkv.weightQ4_0[4096 6144]
-
blk.22.attn_norm.biasF32[4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ4_0[16384 4096]
-
blk.22.ffn_up.weightQ4_0[4096 16384]
-
blk.22.attn_output.weightQ4_0[4096 4096]
-
blk.22.attn_qkv.weightQ4_0[4096 6144]
-
blk.23.attn_norm.biasF32[4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ4_0[16384 4096]
-
blk.23.ffn_up.weightQ4_0[4096 16384]
-
blk.23.attn_output.weightQ4_0[4096 4096]
-
blk.23.attn_qkv.weightQ4_0[4096 6144]
-
blk.24.attn_norm.biasF32[4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ4_0[16384 4096]
-
blk.24.ffn_up.weightQ4_0[4096 16384]
-
blk.24.attn_output.weightQ4_0[4096 4096]
-
blk.24.attn_qkv.weightQ4_0[4096 6144]
-
blk.25.attn_norm.biasF32[4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ4_0[16384 4096]
-
blk.25.ffn_up.weightQ4_0[4096 16384]
-
blk.25.attn_output.weightQ4_0[4096 4096]
-
blk.25.attn_qkv.weightQ4_0[4096 6144]
-
blk.26.ffn_up.weightQ4_0[4096 16384]
-
blk.26.attn_output.weightQ4_0[4096 4096]
-
blk.26.attn_qkv.weightQ4_0[4096 6144]
-
blk.26.attn_norm.biasF32[4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ4_0[16384 4096]
-
blk.27.attn_norm.biasF32[4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ4_0[16384 4096]
-
blk.27.ffn_up.weightQ4_0[4096 16384]
-
blk.27.attn_output.weightQ4_0[4096 4096]
-
blk.27.attn_qkv.weightQ4_0[4096 6144]
-
blk.28.attn_norm.biasF32[4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ4_0[16384 4096]
-
blk.28.ffn_up.weightQ4_0[4096 16384]
-
blk.28.attn_output.weightQ4_0[4096 4096]
-
blk.28.attn_qkv.weightQ4_0[4096 6144]
-
blk.29.attn_norm.biasF32[4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ4_0[16384 4096]
-
blk.29.ffn_up.weightQ4_0[4096 16384]
-
blk.29.attn_output.weightQ4_0[4096 4096]
-
blk.29.attn_qkv.weightQ4_0[4096 6144]
-
blk.30.attn_norm.biasF32[4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ4_0[16384 4096]
-
blk.30.ffn_up.weightQ4_0[4096 16384]
-
blk.30.attn_output.weightQ4_0[4096 4096]
-
blk.30.attn_qkv.weightQ4_0[4096 6144]
-
blk.31.attn_norm.biasF32[4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ4_0[16384 4096]
-
blk.31.ffn_up.weightQ4_0[4096 16384]
-
blk.31.attn_output.weightQ4_0[4096 4096]
-
blk.31.attn_qkv.weightQ4_0[4096 6144]
-
blk.32.attn_norm.biasF32[4096]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.ffn_down.weightQ4_0[16384 4096]
-
blk.32.ffn_up.weightQ4_0[4096 16384]
-
blk.32.attn_output.weightQ4_0[4096 4096]
-
blk.32.attn_qkv.weightQ4_0[4096 6144]
-
blk.33.attn_norm.biasF32[4096]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.ffn_down.weightQ4_0[16384 4096]
-
blk.33.ffn_up.weightQ4_0[4096 16384]
-
blk.33.attn_output.weightQ4_0[4096 4096]
-
blk.33.attn_qkv.weightQ4_0[4096 6144]
-
blk.34.attn_norm.biasF32[4096]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.ffn_down.weightQ4_0[16384 4096]
-
blk.34.ffn_up.weightQ4_0[4096 16384]
-
blk.34.attn_output.weightQ4_0[4096 4096]
-
blk.34.attn_qkv.weightQ4_0[4096 6144]
-
blk.35.attn_norm.biasF32[4096]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.ffn_down.weightQ4_0[16384 4096]
-
blk.35.ffn_up.weightQ4_0[4096 16384]
-
blk.35.attn_output.weightQ4_0[4096 4096]
-
blk.35.attn_qkv.weightQ4_0[4096 6144]
-
blk.36.attn_norm.biasF32[4096]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.ffn_down.weightQ4_0[16384 4096]
-
blk.36.ffn_up.weightQ4_0[4096 16384]
-
blk.36.attn_output.weightQ4_0[4096 4096]
-
blk.36.attn_qkv.weightQ4_0[4096 6144]
-
blk.37.attn_norm.biasF32[4096]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.ffn_down.weightQ4_0[16384 4096]
-
blk.37.ffn_up.weightQ4_0[4096 16384]
-
blk.37.attn_output.weightQ4_0[4096 4096]
-
blk.37.attn_qkv.weightQ4_0[4096 6144]
-
blk.38.attn_norm.biasF32[4096]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.ffn_down.weightQ4_0[16384 4096]
-
blk.38.ffn_up.weightQ4_0[4096 16384]
-
blk.38.attn_output.weightQ4_0[4096 4096]
-
blk.38.attn_qkv.weightQ4_0[4096 6144]
-
blk.39.attn_norm.biasF32[4096]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.ffn_down.weightQ4_0[16384 4096]
-
blk.39.ffn_up.weightQ4_0[4096 16384]
-
blk.39.attn_output.weightQ4_0[4096 4096]
-
blk.39.attn_qkv.weightQ4_0[4096 6144]
-
blk.40.ffn_up.weightQ4_0[4096 16384]
-
blk.40.attn_output.weightQ4_0[4096 4096]
-
blk.40.attn_qkv.weightQ4_0[4096 6144]
-
blk.40.attn_norm.biasF32[4096]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.ffn_down.weightQ4_0[16384 4096]
-
blk.41.attn_norm.biasF32[4096]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.ffn_down.weightQ4_0[16384 4096]
-
blk.41.ffn_up.weightQ4_0[4096 16384]
-
blk.41.attn_output.weightQ4_0[4096 4096]
-
blk.41.attn_qkv.weightQ4_0[4096 6144]
-
blk.42.attn_norm.biasF32[4096]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.ffn_down.weightQ4_0[16384 4096]
-
blk.42.ffn_up.weightQ4_0[4096 16384]
-
blk.42.attn_output.weightQ4_0[4096 4096]
-
blk.42.attn_qkv.weightQ4_0[4096 6144]
-
blk.43.attn_norm.biasF32[4096]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.ffn_down.weightQ4_0[16384 4096]
-
blk.43.ffn_up.weightQ4_0[4096 16384]
-
blk.43.attn_output.weightQ4_0[4096 4096]
-
blk.43.attn_qkv.weightQ4_0[4096 6144]
-
blk.44.attn_norm.biasF32[4096]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.ffn_down.weightQ4_0[16384 4096]
-
blk.44.ffn_up.weightQ4_0[4096 16384]
-
blk.44.attn_output.weightQ4_0[4096 4096]
-
blk.44.attn_qkv.weightQ4_0[4096 6144]
-
blk.45.attn_norm.biasF32[4096]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.ffn_down.weightQ4_0[16384 4096]
-
blk.45.ffn_up.weightQ4_0[4096 16384]
-
blk.45.attn_output.weightQ4_0[4096 4096]
-
blk.45.attn_qkv.weightQ4_0[4096 6144]
-
blk.46.attn_norm.biasF32[4096]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.ffn_down.weightQ4_0[16384 4096]
-
blk.46.ffn_up.weightQ4_0[4096 16384]
-
blk.46.attn_output.weightQ4_0[4096 4096]
-
blk.46.attn_qkv.weightQ4_0[4096 6144]
-
blk.47.attn_norm.biasF32[4096]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.ffn_down.weightQ4_0[16384 4096]
-
blk.47.ffn_up.weightQ4_0[4096 16384]
-
blk.47.attn_output.weightQ4_0[4096 4096]
-
blk.47.attn_qkv.weightQ4_0[4096 6144]
-
blk.48.attn_norm.biasF32[4096]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.ffn_down.weightQ4_0[16384 4096]
-
blk.48.ffn_up.weightQ4_0[4096 16384]
-
blk.48.attn_output.weightQ4_0[4096 4096]
-
blk.48.attn_qkv.weightQ4_0[4096 6144]
-
blk.49.attn_norm.biasF32[4096]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.ffn_down.weightQ4_0[16384 4096]
-
blk.49.ffn_up.weightQ4_0[4096 16384]
-
blk.49.attn_output.weightQ4_0[4096 4096]
-
blk.49.attn_qkv.weightQ4_0[4096 6144]
-
blk.50.attn_norm.biasF32[4096]
-
blk.50.attn_norm.weightF32[4096]
-
blk.50.ffn_down.weightQ4_0[16384 4096]
-
blk.50.ffn_up.weightQ4_0[4096 16384]
-
blk.50.attn_output.weightQ4_0[4096 4096]
-
blk.50.attn_qkv.weightQ4_0[4096 6144]
-
blk.51.attn_norm.biasF32[4096]
-
blk.51.attn_norm.weightF32[4096]
-
blk.51.ffn_down.weightQ4_0[16384 4096]
-
blk.51.ffn_up.weightQ4_0[4096 16384]
-
blk.51.attn_output.weightQ4_0[4096 4096]
-
blk.51.attn_qkv.weightQ4_0[4096 6144]
-
blk.52.attn_norm.biasF32[4096]
-
blk.52.attn_norm.weightF32[4096]
-
blk.52.ffn_down.weightQ4_0[16384 4096]
-
blk.52.ffn_up.weightQ4_0[4096 16384]
-
blk.52.attn_output.weightQ4_0[4096 4096]
-
blk.52.attn_qkv.weightQ4_0[4096 6144]
-
blk.53.attn_norm.biasF32[4096]
-
blk.53.attn_norm.weightF32[4096]
-
blk.53.ffn_down.weightQ4_0[16384 4096]
-
blk.53.ffn_up.weightQ4_0[4096 16384]
-
blk.53.attn_output.weightQ4_0[4096 4096]
-
blk.53.attn_qkv.weightQ4_0[4096 6144]
-
blk.54.ffn_up.weightQ4_0[4096 16384]
-
blk.54.attn_output.weightQ4_0[4096 4096]
-
blk.54.attn_qkv.weightQ4_0[4096 6144]
-
blk.54.attn_norm.biasF32[4096]
-
blk.54.attn_norm.weightF32[4096]
-
blk.54.ffn_down.weightQ4_0[16384 4096]
-
blk.55.attn_norm.biasF32[4096]
-
blk.55.attn_norm.weightF32[4096]
-
blk.55.ffn_down.weightQ4_0[16384 4096]
-
blk.55.ffn_up.weightQ4_0[4096 16384]
-
blk.55.attn_output.weightQ4_0[4096 4096]
-
blk.55.attn_qkv.weightQ4_0[4096 6144]
-
blk.56.attn_norm.biasF32[4096]
-
blk.56.attn_norm.weightF32[4096]
-
blk.56.ffn_down.weightQ4_0[16384 4096]
-
blk.56.ffn_up.weightQ4_0[4096 16384]
-
blk.56.attn_output.weightQ4_0[4096 4096]
-
blk.56.attn_qkv.weightQ4_0[4096 6144]
-
blk.57.attn_norm.biasF32[4096]
-
blk.57.attn_norm.weightF32[4096]
-
blk.57.ffn_down.weightQ4_0[16384 4096]
-
blk.57.ffn_up.weightQ4_0[4096 16384]
-
blk.57.attn_output.weightQ4_0[4096 4096]
-
blk.57.attn_qkv.weightQ4_0[4096 6144]
-
blk.58.attn_norm.biasF32[4096]
-
blk.58.attn_norm.weightF32[4096]
-
blk.58.ffn_down.weightQ4_0[16384 4096]
-
blk.58.ffn_up.weightQ4_0[4096 16384]
-
blk.58.attn_output.weightQ4_0[4096 4096]
-
blk.58.attn_qkv.weightQ4_0[4096 6144]
-
blk.59.attn_norm.biasF32[4096]
-
blk.59.attn_norm.weightF32[4096]
-
blk.59.ffn_down.weightQ4_0[16384 4096]
-
blk.59.ffn_up.weightQ4_0[4096 16384]
-
blk.59.attn_output.weightQ4_0[4096 4096]
-
blk.59.attn_qkv.weightQ4_0[4096 6144]
-
output.weightQ8_0[4096 65024]
-
output_norm.biasF32[4096]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59