https://huggingface.co/gorilla-llm/gorilla-openfunctions-v2-gguf
7B
1,166 Pulls Updated 6 months ago
f23ce98c7a23 · 3.7GB
-
general.architecturellama
-
general.file_typeQ3_K_L
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count30
-
llama.context_length4096
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
tokenizer.ggml.bos_token_id100000
-
tokenizer.ggml.eos_token_id100015
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id100001
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ3_K[4096 102400]
-
blk.0.attn_q.weightQ3_K[4096 4096]
-
blk.0.attn_k.weightQ3_K[4096 4096]
-
blk.0.attn_v.weightQ5_K[4096 4096]
-
blk.0.attn_output.weightQ5_K[4096 4096]
-
blk.0.ffn_gate.weightQ3_K[4096 11008]
-
blk.0.ffn_up.weightQ3_K[4096 11008]
-
blk.0.ffn_down.weightQ5_K[11008 4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.1.attn_q.weightQ3_K[4096 4096]
-
blk.1.attn_k.weightQ3_K[4096 4096]
-
blk.1.attn_v.weightQ5_K[4096 4096]
-
blk.1.attn_output.weightQ5_K[4096 4096]
-
blk.1.ffn_gate.weightQ3_K[4096 11008]
-
blk.1.ffn_up.weightQ3_K[4096 11008]
-
blk.1.ffn_down.weightQ5_K[11008 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.2.attn_q.weightQ3_K[4096 4096]
-
blk.2.attn_k.weightQ3_K[4096 4096]
-
blk.2.attn_v.weightQ5_K[4096 4096]
-
blk.2.attn_output.weightQ5_K[4096 4096]
-
blk.2.ffn_gate.weightQ3_K[4096 11008]
-
blk.2.ffn_up.weightQ3_K[4096 11008]
-
blk.2.ffn_down.weightQ5_K[11008 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.3.attn_q.weightQ3_K[4096 4096]
-
blk.3.attn_k.weightQ3_K[4096 4096]
-
blk.3.attn_v.weightQ5_K[4096 4096]
-
blk.3.attn_output.weightQ5_K[4096 4096]
-
blk.3.ffn_gate.weightQ3_K[4096 11008]
-
blk.3.ffn_up.weightQ3_K[4096 11008]
-
blk.3.ffn_down.weightQ5_K[11008 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.4.attn_q.weightQ3_K[4096 4096]
-
blk.4.attn_k.weightQ3_K[4096 4096]
-
blk.4.attn_v.weightQ5_K[4096 4096]
-
blk.4.attn_output.weightQ5_K[4096 4096]
-
blk.4.ffn_gate.weightQ3_K[4096 11008]
-
blk.4.ffn_up.weightQ3_K[4096 11008]
-
blk.4.ffn_down.weightQ5_K[11008 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.5.attn_q.weightQ3_K[4096 4096]
-
blk.5.attn_k.weightQ3_K[4096 4096]
-
blk.5.attn_v.weightQ5_K[4096 4096]
-
blk.5.attn_output.weightQ5_K[4096 4096]
-
blk.5.ffn_gate.weightQ3_K[4096 11008]
-
blk.5.ffn_up.weightQ3_K[4096 11008]
-
blk.5.ffn_down.weightQ5_K[11008 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.6.attn_q.weightQ3_K[4096 4096]
-
blk.6.attn_k.weightQ3_K[4096 4096]
-
blk.6.attn_v.weightQ5_K[4096 4096]
-
blk.6.attn_output.weightQ5_K[4096 4096]
-
blk.6.ffn_gate.weightQ3_K[4096 11008]
-
blk.6.ffn_up.weightQ3_K[4096 11008]
-
blk.6.ffn_down.weightQ5_K[11008 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.7.attn_q.weightQ3_K[4096 4096]
-
blk.7.attn_k.weightQ3_K[4096 4096]
-
blk.7.attn_v.weightQ5_K[4096 4096]
-
blk.7.attn_output.weightQ5_K[4096 4096]
-
blk.7.ffn_gate.weightQ3_K[4096 11008]
-
blk.7.ffn_up.weightQ3_K[4096 11008]
-
blk.7.ffn_down.weightQ5_K[11008 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.8.attn_q.weightQ3_K[4096 4096]
-
blk.8.attn_k.weightQ3_K[4096 4096]
-
blk.8.attn_v.weightQ5_K[4096 4096]
-
blk.8.attn_output.weightQ5_K[4096 4096]
-
blk.8.ffn_gate.weightQ3_K[4096 11008]
-
blk.8.ffn_up.weightQ3_K[4096 11008]
-
blk.8.ffn_down.weightQ5_K[11008 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.9.attn_q.weightQ3_K[4096 4096]
-
blk.9.attn_k.weightQ3_K[4096 4096]
-
blk.9.attn_v.weightQ5_K[4096 4096]
-
blk.9.attn_output.weightQ5_K[4096 4096]
-
blk.9.ffn_gate.weightQ3_K[4096 11008]
-
blk.9.ffn_up.weightQ3_K[4096 11008]
-
blk.9.ffn_down.weightQ5_K[11008 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.10.attn_q.weightQ3_K[4096 4096]
-
blk.10.attn_k.weightQ3_K[4096 4096]
-
blk.10.attn_v.weightQ5_K[4096 4096]
-
blk.10.attn_output.weightQ5_K[4096 4096]
-
blk.10.ffn_gate.weightQ3_K[4096 11008]
-
blk.10.ffn_up.weightQ3_K[4096 11008]
-
blk.10.ffn_down.weightQ5_K[11008 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.11.attn_q.weightQ3_K[4096 4096]
-
blk.11.attn_k.weightQ3_K[4096 4096]
-
blk.11.attn_v.weightQ5_K[4096 4096]
-
blk.11.attn_output.weightQ5_K[4096 4096]
-
blk.11.ffn_gate.weightQ3_K[4096 11008]
-
blk.11.ffn_up.weightQ3_K[4096 11008]
-
blk.11.ffn_down.weightQ5_K[11008 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_q.weightQ3_K[4096 4096]
-
blk.12.attn_k.weightQ3_K[4096 4096]
-
blk.12.attn_v.weightQ5_K[4096 4096]
-
blk.12.attn_output.weightQ5_K[4096 4096]
-
blk.12.ffn_gate.weightQ3_K[4096 11008]
-
blk.12.ffn_up.weightQ3_K[4096 11008]
-
blk.12.ffn_down.weightQ5_K[11008 4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_q.weightQ3_K[4096 4096]
-
blk.13.attn_k.weightQ3_K[4096 4096]
-
blk.13.attn_v.weightQ5_K[4096 4096]
-
blk.13.attn_output.weightQ5_K[4096 4096]
-
blk.13.ffn_gate.weightQ3_K[4096 11008]
-
blk.13.ffn_up.weightQ3_K[4096 11008]
-
blk.13.ffn_down.weightQ5_K[11008 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.14.attn_q.weightQ3_K[4096 4096]
-
blk.14.attn_k.weightQ3_K[4096 4096]
-
blk.14.attn_v.weightQ5_K[4096 4096]
-
blk.14.attn_output.weightQ5_K[4096 4096]
-
blk.14.ffn_gate.weightQ3_K[4096 11008]
-
blk.14.ffn_up.weightQ3_K[4096 11008]
-
blk.14.ffn_down.weightQ5_K[11008 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.15.attn_q.weightQ3_K[4096 4096]
-
blk.15.attn_k.weightQ3_K[4096 4096]
-
blk.15.attn_v.weightQ5_K[4096 4096]
-
blk.15.attn_output.weightQ5_K[4096 4096]
-
blk.15.ffn_gate.weightQ3_K[4096 11008]
-
blk.15.ffn_up.weightQ3_K[4096 11008]
-
blk.15.ffn_down.weightQ5_K[11008 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.16.attn_q.weightQ3_K[4096 4096]
-
blk.16.attn_k.weightQ3_K[4096 4096]
-
blk.16.attn_v.weightQ5_K[4096 4096]
-
blk.16.attn_output.weightQ5_K[4096 4096]
-
blk.16.ffn_gate.weightQ3_K[4096 11008]
-
blk.16.ffn_up.weightQ3_K[4096 11008]
-
blk.16.ffn_down.weightQ5_K[11008 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.17.attn_q.weightQ3_K[4096 4096]
-
blk.17.attn_k.weightQ3_K[4096 4096]
-
blk.17.attn_v.weightQ5_K[4096 4096]
-
blk.17.attn_output.weightQ5_K[4096 4096]
-
blk.17.ffn_gate.weightQ3_K[4096 11008]
-
blk.17.ffn_up.weightQ3_K[4096 11008]
-
blk.17.ffn_down.weightQ5_K[11008 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.18.attn_q.weightQ3_K[4096 4096]
-
blk.18.attn_k.weightQ3_K[4096 4096]
-
blk.18.attn_v.weightQ5_K[4096 4096]
-
blk.18.attn_output.weightQ5_K[4096 4096]
-
blk.18.ffn_gate.weightQ3_K[4096 11008]
-
blk.18.ffn_up.weightQ3_K[4096 11008]
-
blk.18.ffn_down.weightQ5_K[11008 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.19.attn_q.weightQ3_K[4096 4096]
-
blk.19.attn_k.weightQ3_K[4096 4096]
-
blk.19.attn_v.weightQ5_K[4096 4096]
-
blk.19.attn_output.weightQ5_K[4096 4096]
-
blk.19.ffn_gate.weightQ3_K[4096 11008]
-
blk.19.ffn_up.weightQ3_K[4096 11008]
-
blk.19.ffn_down.weightQ5_K[11008 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.20.attn_q.weightQ3_K[4096 4096]
-
blk.20.attn_k.weightQ3_K[4096 4096]
-
blk.20.attn_v.weightQ5_K[4096 4096]
-
blk.20.attn_output.weightQ5_K[4096 4096]
-
blk.20.ffn_gate.weightQ3_K[4096 11008]
-
blk.20.ffn_up.weightQ3_K[4096 11008]
-
blk.20.ffn_down.weightQ5_K[11008 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.21.attn_q.weightQ3_K[4096 4096]
-
blk.21.attn_k.weightQ3_K[4096 4096]
-
blk.21.attn_v.weightQ5_K[4096 4096]
-
blk.21.attn_output.weightQ5_K[4096 4096]
-
blk.21.ffn_gate.weightQ3_K[4096 11008]
-
blk.21.ffn_up.weightQ3_K[4096 11008]
-
blk.21.ffn_down.weightQ5_K[11008 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.22.attn_q.weightQ3_K[4096 4096]
-
blk.22.attn_k.weightQ3_K[4096 4096]
-
blk.22.attn_v.weightQ5_K[4096 4096]
-
blk.22.attn_output.weightQ5_K[4096 4096]
-
blk.22.ffn_gate.weightQ3_K[4096 11008]
-
blk.22.ffn_up.weightQ3_K[4096 11008]
-
blk.22.ffn_down.weightQ5_K[11008 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.23.attn_q.weightQ3_K[4096 4096]
-
blk.23.attn_k.weightQ3_K[4096 4096]
-
blk.23.attn_v.weightQ5_K[4096 4096]
-
blk.23.attn_output.weightQ5_K[4096 4096]
-
blk.23.ffn_gate.weightQ3_K[4096 11008]
-
blk.23.ffn_up.weightQ3_K[4096 11008]
-
blk.23.ffn_down.weightQ5_K[11008 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_q.weightQ3_K[4096 4096]
-
blk.24.attn_k.weightQ3_K[4096 4096]
-
blk.24.attn_v.weightQ5_K[4096 4096]
-
blk.24.attn_output.weightQ5_K[4096 4096]
-
blk.24.ffn_gate.weightQ3_K[4096 11008]
-
blk.24.ffn_up.weightQ3_K[4096 11008]
-
blk.24.ffn_down.weightQ5_K[11008 4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.25.attn_q.weightQ3_K[4096 4096]
-
blk.25.attn_k.weightQ3_K[4096 4096]
-
blk.25.attn_v.weightQ5_K[4096 4096]
-
blk.25.attn_output.weightQ5_K[4096 4096]
-
blk.25.ffn_gate.weightQ3_K[4096 11008]
-
blk.25.ffn_up.weightQ3_K[4096 11008]
-
blk.25.ffn_down.weightQ5_K[11008 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.26.attn_q.weightQ3_K[4096 4096]
-
blk.26.attn_k.weightQ3_K[4096 4096]
-
blk.26.attn_v.weightQ5_K[4096 4096]
-
blk.26.attn_output.weightQ5_K[4096 4096]
-
blk.26.ffn_gate.weightQ3_K[4096 11008]
-
blk.26.ffn_up.weightQ3_K[4096 11008]
-
blk.26.ffn_down.weightQ5_K[11008 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.27.attn_q.weightQ3_K[4096 4096]
-
blk.27.attn_k.weightQ3_K[4096 4096]
-
blk.27.attn_v.weightQ5_K[4096 4096]
-
blk.27.attn_output.weightQ5_K[4096 4096]
-
blk.27.ffn_gate.weightQ3_K[4096 11008]
-
blk.27.ffn_up.weightQ3_K[4096 11008]
-
blk.27.ffn_down.weightQ5_K[11008 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.28.attn_q.weightQ3_K[4096 4096]
-
blk.28.attn_k.weightQ3_K[4096 4096]
-
blk.28.attn_v.weightQ5_K[4096 4096]
-
blk.28.attn_output.weightQ5_K[4096 4096]
-
blk.28.ffn_gate.weightQ3_K[4096 11008]
-
blk.28.ffn_up.weightQ3_K[4096 11008]
-
blk.28.ffn_down.weightQ5_K[11008 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.29.attn_q.weightQ3_K[4096 4096]
-
blk.29.attn_k.weightQ3_K[4096 4096]
-
blk.29.attn_v.weightQ5_K[4096 4096]
-
blk.29.attn_output.weightQ5_K[4096 4096]
-
blk.29.ffn_gate.weightQ3_K[4096 11008]
-
blk.29.ffn_up.weightQ3_K[4096 11008]
-
blk.29.ffn_down.weightQ5_K[11008 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_norm.weightF32[4096]
-
output_norm.weightF32[4096]
-
output.weightQ6_K[4096 102400]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29