free02/ glm5.1:part1

149 1 month ago

01753c4cbfda · 9.4MB
    Metadata
  • general.architecture
    glm-dsa
  • general.file_type
    IQ2_M
  • glm-dsa.attention.head_count
    64
  • glm-dsa.attention.head_count_kv
    1
  • glm-dsa.attention.indexer.head_count
    32
  • glm-dsa.attention.indexer.key_length
    128
  • glm-dsa.attention.indexer.top_k
    2048
  • glm-dsa.attention.key_length
    576
  • glm-dsa.attention.key_length_mla
    256
  • glm-dsa.attention.kv_lora_rank
    512
  • glm-dsa.attention.layer_norm_rms_epsilon
    1e-05
  • glm-dsa.attention.q_lora_rank
    2048
  • glm-dsa.attention.value_length
    512
  • glm-dsa.attention.value_length_mla
    256
  • glm-dsa.block_count
    79
  • glm-dsa.context_length
    202752
  • glm-dsa.embedding_length
    6144
  • glm-dsa.expert_count
    256
  • glm-dsa.expert_feed_forward_length
    2048
  • glm-dsa.expert_gating_func
    2
  • glm-dsa.expert_group_count
    1
  • glm-dsa.expert_group_used_count
    1
  • glm-dsa.expert_shared_count
    1
  • glm-dsa.expert_used_count
    8
  • glm-dsa.expert_weights_norm
    true
  • glm-dsa.expert_weights_scale
    2.5
  • glm-dsa.feed_forward_length
    12288
  • glm-dsa.leading_dense_block_count
    3
  • glm-dsa.nextn_predict_layers
    1
  • glm-dsa.rope.dimension_count
    64
  • glm-dsa.rope.freq_base
    1e+06
  • glm-dsa.vocab_size
    154880
  • tokenizer.ggml.bos_token_id
    154822
  • tokenizer.ggml.eom_token_id
    154829
  • tokenizer.ggml.eos_token_id
    154820
  • tokenizer.ggml.eot_token_id
    154827
  • tokenizer.ggml.merges
    [Ġ Ġ, Ġ ĠĠĠ, ĠĠ ĠĠ, ĠĠĠ Ġ, i n, ...]
  • tokenizer.ggml.model
    gpt2
  • tokenizer.ggml.padding_token_id
    154821
  • tokenizer.ggml.pre
    glm4
  • tokenizer.ggml.token_type
    [1, 1, 1, 1, 1, ...]
  • tokenizer.ggml.tokens
    [!, ", #, $, %, ...]
  • tokenizer.ggml.unknown_token_id
    154820
  • quantize.imatrix.chunks_count
    78
  • quantize.imatrix.dataset
    unsloth_calibration_GLM-5.1.txt
  • quantize.imatrix.entries_count
    1002
  • quantize.imatrix.file
    GLM-5.1-GGUF/imatrix_unsloth.gguf
  • split.count
    6
  • split.no
    0
  • split.tensors.count
    1809
  • Tensor