KeyLM-75M-Instruct / configuration_keylm.py
Eclipse-Senpai's picture
main commit
a7de577 verified
raw
history blame contribute delete
459 Bytes
"""KeyLM model configuration.
KeyLM-75M is a from-scratch small language model. Its decoder block follows
the Qwen3 layout (grouped-query attention, RoPE, SwiGLU, and per-head
QK-RMSNorm), so the configuration inherits from Qwen3Config and overrides only
``model_type``, giving the model its own identity on the Hub.
"""
from transformers.models.qwen3.configuration_qwen3 import Qwen3Config
class KeyLM75MConfig(Qwen3Config):
    """Configuration class for KeyLM-75M.

    Every field and default is inherited unchanged from ``Qwen3Config``; the
    only override is ``model_type``.
    """

    # Distinct identifier so this configuration is not reported as the
    # parent class's model type.
    model_type = "keylm75m"