A small general-purpose model combined with enticing roleplaying models. It introduces better RAG capabilities (in the form of Bagel) to Llama 3 8B Instruct, as well as German multilingual support, higher general intelligence, and vision support.

8B

399 Pulls Updated 7 weeks ago

744d54c5070d · 5.7GB
{ "metadata": { "general.architecture": "llama", "general.file_type": 17, "general.name": "Llama-3-8B-Ultra-Instruct", "general.quantization_version": 2, "llama.attention.head_count": 32, "llama.attention.head_count_kv": 8, "llama.attention.layer_norm_rms_epsilon": 0.00001, "llama.block_count": 32, "llama.context_length": 8192, "llama.embedding_length": 4096, "llama.feed_forward_length": 14336, "llama.rope.dimension_count": 128, "llama.rope.freq_base": 500000, "llama.vocab_size": 128256, "quantize.imatrix.chunks_count": 88, "quantize.imatrix.dataset": "/training_data/groups_merged.txt", "quantize.imatrix.entries_count": 224, "quantize.imatrix.file": "/models/Llama-3-8B-Ultra-Instruct-GGUF/Llama-3-8B-Ultra-Instruct.imatrix", "tokenizer.ggml.bos_token_id": 128000, "tokenizer.ggml.eos_token_id": 128001, "tokenizer.ggml.merges": "... (280147 values)", "tokenizer.ggml.model": "gpt2", "tokenizer.ggml.pre": "llama-bpe", "tokenizer.ggml.token_type": "... (128256 values)", "tokenizer.ggml.tokens": "... 
(128256 values)" }, "num_params": 8030261248, "tensors": [ { "name": "token_embd.weight", "offset": 430940160, "shape": [ 4096, 128256 ], "size": 430940160, "type": 13 }, { "name": "blk.0.attn_norm.weight", "offset": 792109056, "shape": [ 4096 ], "size": 361168896, "type": 0 }, { "name": "blk.0.ffn_down.weight", "offset": 792125440, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.0.ffn_gate.weight", "offset": 840294400, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.0.ffn_up.weight", "offset": 880664576, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.0.ffn_norm.weight", "offset": 921034752, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.0.attn_k.weight", "offset": 921051136, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.0.attn_output.weight", "offset": 923934720, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.0.attn_q.weight", "offset": 935469056, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.0.attn_v.weight", "offset": 947003392, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.1.attn_norm.weight", "offset": 950444032, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.1.ffn_down.weight", "offset": 950460416, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.1.ffn_gate.weight", "offset": 998629376, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.1.ffn_up.weight", "offset": 1038999552, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.1.ffn_norm.weight", "offset": 1079369728, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.1.attn_k.weight", "offset": 1079386112, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.1.attn_output.weight", "offset": 1082269696, "shape": [ 
4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.1.attn_q.weight", "offset": 1093804032, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.1.attn_v.weight", "offset": 1105338368, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.10.attn_norm.weight", "offset": 1108779008, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.10.ffn_down.weight", "offset": 1108795392, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.10.ffn_gate.weight", "offset": 1156964352, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.10.ffn_up.weight", "offset": 1197334528, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.10.ffn_norm.weight", "offset": 1237704704, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.10.attn_k.weight", "offset": 1237721088, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.10.attn_output.weight", "offset": 1240604672, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.10.attn_q.weight", "offset": 1252139008, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.10.attn_v.weight", "offset": 1263673344, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.11.attn_norm.weight", "offset": 1267113984, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.11.ffn_down.weight", "offset": 1267130368, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.11.ffn_gate.weight", "offset": 1315299328, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.11.ffn_up.weight", "offset": 1355669504, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.11.ffn_norm.weight", "offset": 1396039680, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.11.attn_k.weight", "offset": 1396056064, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.11.attn_output.weight", "offset": 
1398939648, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.11.attn_q.weight", "offset": 1410473984, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.11.attn_v.weight", "offset": 1422008320, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.12.attn_norm.weight", "offset": 1425448960, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.12.ffn_down.weight", "offset": 1425465344, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.12.ffn_gate.weight", "offset": 1465835520, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.12.ffn_up.weight", "offset": 1506205696, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.12.ffn_norm.weight", "offset": 1546575872, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.12.attn_k.weight", "offset": 1546592256, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.12.attn_output.weight", "offset": 1549475840, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.12.attn_q.weight", "offset": 1561010176, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.12.attn_v.weight", "offset": 1572544512, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.13.attn_norm.weight", "offset": 1575428096, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.13.ffn_down.weight", "offset": 1575444480, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.13.ffn_gate.weight", "offset": 1615814656, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.13.ffn_up.weight", "offset": 1656184832, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.13.ffn_norm.weight", "offset": 1696555008, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.13.attn_k.weight", "offset": 1696571392, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": 
"blk.13.attn_output.weight", "offset": 1699454976, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.13.attn_q.weight", "offset": 1710989312, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.13.attn_v.weight", "offset": 1722523648, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.14.attn_norm.weight", "offset": 1725407232, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.14.ffn_down.weight", "offset": 1725423616, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.14.ffn_gate.weight", "offset": 1773592576, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.14.ffn_up.weight", "offset": 1813962752, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.14.ffn_norm.weight", "offset": 1854332928, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.14.attn_k.weight", "offset": 1854349312, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.14.attn_output.weight", "offset": 1857232896, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.14.attn_q.weight", "offset": 1868767232, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.14.attn_v.weight", "offset": 1880301568, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.15.attn_norm.weight", "offset": 1883742208, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.15.ffn_down.weight", "offset": 1883758592, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.15.ffn_gate.weight", "offset": 1924128768, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.15.ffn_up.weight", "offset": 1964498944, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.15.ffn_norm.weight", "offset": 2004869120, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.15.attn_k.weight", "offset": 2004885504, "shape": [ 4096, 1024 ], "size": 16384, 
"type": 13 }, { "name": "blk.15.attn_output.weight", "offset": 2007769088, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.15.attn_q.weight", "offset": 2019303424, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.15.attn_v.weight", "offset": 2030837760, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.16.attn_norm.weight", "offset": 2033721344, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.16.ffn_down.weight", "offset": 2033737728, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.16.ffn_gate.weight", "offset": 2074107904, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.16.ffn_up.weight", "offset": 2114478080, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.16.ffn_norm.weight", "offset": 2154848256, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.16.attn_k.weight", "offset": 2154864640, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.16.attn_output.weight", "offset": 2157748224, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.16.attn_q.weight", "offset": 2169282560, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.16.attn_v.weight", "offset": 2180816896, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.17.attn_norm.weight", "offset": 2183700480, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.17.ffn_down.weight", "offset": 2183716864, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.17.ffn_gate.weight", "offset": 2231885824, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.17.ffn_up.weight", "offset": 2272256000, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.17.ffn_norm.weight", "offset": 2312626176, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.17.attn_k.weight", "offset": 2312642560, "shape": [ 
4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.17.attn_output.weight", "offset": 2315526144, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.17.attn_q.weight", "offset": 2327060480, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.17.attn_v.weight", "offset": 2338594816, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.18.attn_norm.weight", "offset": 2342035456, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.18.ffn_down.weight", "offset": 2342051840, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.18.ffn_gate.weight", "offset": 2382422016, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.18.ffn_up.weight", "offset": 2422792192, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.18.ffn_norm.weight", "offset": 2463162368, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.18.attn_k.weight", "offset": 2463178752, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.18.attn_output.weight", "offset": 2466062336, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.18.attn_q.weight", "offset": 2477596672, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.18.attn_v.weight", "offset": 2489131008, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.19.attn_norm.weight", "offset": 2492014592, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.19.ffn_down.weight", "offset": 2492030976, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.19.ffn_gate.weight", "offset": 2532401152, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.19.ffn_up.weight", "offset": 2572771328, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.19.ffn_norm.weight", "offset": 2613141504, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.19.attn_k.weight", 
"offset": 2613157888, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.19.attn_output.weight", "offset": 2616041472, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.19.attn_q.weight", "offset": 2627575808, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.19.attn_v.weight", "offset": 2639110144, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.2.attn_norm.weight", "offset": 2641993728, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.2.ffn_down.weight", "offset": 2642010112, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.2.ffn_gate.weight", "offset": 2690179072, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.2.ffn_up.weight", "offset": 2730549248, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.2.ffn_norm.weight", "offset": 2770919424, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.2.attn_k.weight", "offset": 2770935808, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.2.attn_output.weight", "offset": 2773819392, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.2.attn_q.weight", "offset": 2785353728, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.2.attn_v.weight", "offset": 2796888064, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.20.attn_norm.weight", "offset": 2800328704, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.20.ffn_down.weight", "offset": 2800345088, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.20.ffn_gate.weight", "offset": 2840715264, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.20.ffn_up.weight", "offset": 2881085440, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.20.ffn_norm.weight", "offset": 2921455616, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": 
"blk.20.attn_k.weight", "offset": 2921472000, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.20.attn_output.weight", "offset": 2924355584, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.20.attn_q.weight", "offset": 2935889920, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.20.attn_v.weight", "offset": 2947424256, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.21.attn_norm.weight", "offset": 2950307840, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.21.ffn_down.weight", "offset": 2950324224, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.21.ffn_gate.weight", "offset": 2990694400, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.21.ffn_up.weight", "offset": 3031064576, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.21.ffn_norm.weight", "offset": 3071434752, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.21.attn_k.weight", "offset": 3071451136, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.21.attn_output.weight", "offset": 3074334720, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.21.attn_q.weight", "offset": 3085869056, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.21.attn_v.weight", "offset": 3097403392, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.22.attn_norm.weight", "offset": 3100286976, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.22.ffn_down.weight", "offset": 3100303360, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.22.ffn_gate.weight", "offset": 3148472320, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.22.ffn_up.weight", "offset": 3188842496, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.22.ffn_norm.weight", "offset": 3229212672, "shape": [ 4096 ], "size": 
40370176, "type": 0 }, { "name": "blk.22.attn_k.weight", "offset": 3229229056, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.22.attn_output.weight", "offset": 3232112640, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.22.attn_q.weight", "offset": 3243646976, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.22.attn_v.weight", "offset": 3255181312, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.23.attn_norm.weight", "offset": 3258621952, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.23.ffn_down.weight", "offset": 3258638336, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.23.ffn_gate.weight", "offset": 3299008512, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.23.ffn_up.weight", "offset": 3339378688, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.23.ffn_norm.weight", "offset": 3379748864, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.23.attn_k.weight", "offset": 3379765248, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.23.attn_output.weight", "offset": 3382648832, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.23.attn_q.weight", "offset": 3394183168, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.23.attn_v.weight", "offset": 3405717504, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.24.attn_norm.weight", "offset": 3408601088, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.24.ffn_down.weight", "offset": 3408617472, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.24.ffn_gate.weight", "offset": 3448987648, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.24.ffn_up.weight", "offset": 3489357824, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.24.ffn_norm.weight", "offset": 3529728000, 
"shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.24.attn_k.weight", "offset": 3529744384, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.24.attn_output.weight", "offset": 3532627968, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.24.attn_q.weight", "offset": 3544162304, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.24.attn_v.weight", "offset": 3555696640, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.25.attn_norm.weight", "offset": 3558580224, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.25.ffn_down.weight", "offset": 3558596608, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.25.ffn_gate.weight", "offset": 3606765568, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.25.ffn_up.weight", "offset": 3647135744, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.25.ffn_norm.weight", "offset": 3687505920, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.25.attn_k.weight", "offset": 3687522304, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.25.attn_output.weight", "offset": 3690405888, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.25.attn_q.weight", "offset": 3701940224, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.25.attn_v.weight", "offset": 3713474560, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.26.attn_norm.weight", "offset": 3716915200, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.26.ffn_down.weight", "offset": 3716931584, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.26.ffn_gate.weight", "offset": 3757301760, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.26.ffn_up.weight", "offset": 3797671936, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": 
"blk.26.ffn_norm.weight", "offset": 3838042112, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.26.attn_k.weight", "offset": 3838058496, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.26.attn_output.weight", "offset": 3840942080, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.26.attn_q.weight", "offset": 3852476416, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.26.attn_v.weight", "offset": 3864010752, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.27.attn_norm.weight", "offset": 3866894336, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.27.ffn_down.weight", "offset": 3866910720, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.27.ffn_gate.weight", "offset": 3907280896, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.27.ffn_up.weight", "offset": 3947651072, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.27.ffn_norm.weight", "offset": 3988021248, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.27.attn_k.weight", "offset": 3988037632, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.27.attn_output.weight", "offset": 3990921216, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.27.attn_q.weight", "offset": 4002455552, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.27.attn_v.weight", "offset": 4013989888, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.28.attn_norm.weight", "offset": 4016873472, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.28.ffn_down.weight", "offset": 4016889856, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.28.ffn_gate.weight", "offset": 4065058816, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.28.ffn_up.weight", "offset": 4105428992, "shape": [ 4096, 14336 ], "size": 40370176, 
"type": 13 }, { "name": "blk.28.ffn_norm.weight", "offset": 4145799168, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.28.attn_k.weight", "offset": 4145815552, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.28.attn_output.weight", "offset": 4148699136, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.28.attn_q.weight", "offset": 4160233472, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.28.attn_v.weight", "offset": 4171767808, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.29.attn_norm.weight", "offset": 4175208448, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.29.ffn_down.weight", "offset": 4175224832, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.29.ffn_gate.weight", "offset": 4215595008, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.29.ffn_up.weight", "offset": 4255965184, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.29.ffn_norm.weight", "offset": 4296335360, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.29.attn_k.weight", "offset": 4296351744, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.29.attn_output.weight", "offset": 4299235328, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.29.attn_q.weight", "offset": 4310769664, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.29.attn_v.weight", "offset": 4322304000, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.3.attn_norm.weight", "offset": 4325187584, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.3.ffn_down.weight", "offset": 4325203968, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.3.ffn_gate.weight", "offset": 4365574144, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.3.ffn_up.weight", "offset": 4405944320, "shape": [ 4096, 14336 
], "size": 40370176, "type": 13 }, { "name": "blk.3.ffn_norm.weight", "offset": 4446314496, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.3.attn_k.weight", "offset": 4446330880, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.3.attn_output.weight", "offset": 4449214464, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.3.attn_q.weight", "offset": 4460748800, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.3.attn_v.weight", "offset": 4472283136, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.30.attn_norm.weight", "offset": 4475166720, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.30.ffn_down.weight", "offset": 4475183104, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.30.ffn_gate.weight", "offset": 4523352064, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.30.ffn_up.weight", "offset": 4563722240, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.30.ffn_norm.weight", "offset": 4604092416, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.30.attn_k.weight", "offset": 4604108800, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.30.attn_output.weight", "offset": 4606992384, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.30.attn_q.weight", "offset": 4618526720, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.30.attn_v.weight", "offset": 4630061056, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.31.attn_norm.weight", "offset": 4633501696, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.31.ffn_down.weight", "offset": 4633518080, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.31.ffn_gate.weight", "offset": 4673888256, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.31.ffn_up.weight", "offset": 4714258432, 
"shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.31.ffn_norm.weight", "offset": 4754628608, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.31.attn_k.weight", "offset": 4754644992, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.31.attn_output.weight", "offset": 4757528576, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.31.attn_q.weight", "offset": 4769062912, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.31.attn_v.weight", "offset": 4780597248, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.4.attn_norm.weight", "offset": 4783480832, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.4.ffn_down.weight", "offset": 4783497216, "shape": [ 14336, 4096 ], "size": 16384, "type": 13 }, { "name": "blk.4.ffn_gate.weight", "offset": 4823867392, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.4.ffn_up.weight", "offset": 4864237568, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.4.ffn_norm.weight", "offset": 4904607744, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.4.attn_k.weight", "offset": 4904624128, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.4.attn_output.weight", "offset": 4907507712, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.4.attn_q.weight", "offset": 4919042048, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.4.attn_v.weight", "offset": 4930576384, "shape": [ 4096, 1024 ], "size": 11534336, "type": 13 }, { "name": "blk.5.attn_norm.weight", "offset": 4933459968, "shape": [ 4096 ], "size": 2883584, "type": 0 }, { "name": "blk.5.ffn_down.weight", "offset": 4933476352, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.5.ffn_gate.weight", "offset": 4981645312, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.5.ffn_up.weight", "offset": 
5022015488, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.5.ffn_norm.weight", "offset": 5062385664, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.5.attn_k.weight", "offset": 5062402048, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.5.attn_output.weight", "offset": 5065285632, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.5.attn_q.weight", "offset": 5076819968, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.5.attn_v.weight", "offset": 5088354304, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.6.attn_norm.weight", "offset": 5091794944, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.6.ffn_down.weight", "offset": 5091811328, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.6.ffn_gate.weight", "offset": 5139980288, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.6.ffn_up.weight", "offset": 5180350464, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.6.ffn_norm.weight", "offset": 5220720640, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.6.attn_k.weight", "offset": 5220737024, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.6.attn_output.weight", "offset": 5223620608, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.6.attn_q.weight", "offset": 5235154944, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.6.attn_v.weight", "offset": 5246689280, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.7.attn_norm.weight", "offset": 5250129920, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.7.ffn_down.weight", "offset": 5250146304, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.7.ffn_gate.weight", "offset": 5298315264, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.7.ffn_up.weight", 
"offset": 5338685440, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.7.ffn_norm.weight", "offset": 5379055616, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.7.attn_k.weight", "offset": 5379072000, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.7.attn_output.weight", "offset": 5381955584, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.7.attn_q.weight", "offset": 5393489920, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.7.attn_v.weight", "offset": 5405024256, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.8.attn_norm.weight", "offset": 5408464896, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.8.ffn_down.weight", "offset": 5408481280, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.8.ffn_gate.weight", "offset": 5456650240, "shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.8.ffn_up.weight", "offset": 5497020416, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.8.ffn_norm.weight", "offset": 5537390592, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.8.attn_k.weight", "offset": 5537406976, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.8.attn_output.weight", "offset": 5540290560, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "\ufffd\ufffd\u0004\ufffd\ufffd\ufffd\ufffd\ufffd\ufffdi\ufffd\u001a\ufffd\ufffdb\u0019^\ufffd\ufffd", "offset": 5551824896, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.8.attn_v.weight", "offset": 5563359232, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "blk.9.attn_norm.weight", "offset": 5566799872, "shape": [ 4096 ], "size": 3440640, "type": 0 }, { "name": "blk.9.ffn_down.weight", "offset": 5566816256, "shape": [ 14336, 4096 ], "size": 16384, "type": 14 }, { "name": "blk.9.ffn_gate.weight", "offset": 5614985216, 
"shape": [ 4096, 14336 ], "size": 48168960, "type": 13 }, { "name": "blk.9.ffn_up.weight", "offset": 5655355392, "shape": [ 4096, 14336 ], "size": 40370176, "type": 13 }, { "name": "blk.9.ffn_norm.weight", "offset": 5695725568, "shape": [ 4096 ], "size": 40370176, "type": 0 }, { "name": "blk.9.attn_k.weight", "offset": 5695741952, "shape": [ 4096, 1024 ], "size": 16384, "type": 13 }, { "name": "blk.9.attn_output.weight", "offset": 5698625536, "shape": [ 4096, 4096 ], "size": 2883584, "type": 13 }, { "name": "blk.9.attn_q.weight", "offset": 5710159872, "shape": [ 4096, 4096 ], "size": 11534336, "type": 13 }, { "name": "blk.9.attn_v.weight", "offset": 5721694208, "shape": [ 4096, 1024 ], "size": 11534336, "type": 14 }, { "name": "output_norm.weight", "offset": 5725134848, "shape": [ 4096 ], "size": 3440640, "type": 0 } ], "version": 3 }