File size: 597 Bytes
6ea104c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 |
# -*- coding: utf-8 -*-
"""
Subspace Decoder Package
A Transformer decoder implementation with Multi-Head Latent Attention (MLA)
and decomposed MLP layers for efficient parameter usage.
"""
# Import all the main classes from models
from .models import (
SharedSpaceDecoderConfig,
SharedSpaceDecoderPreTrainedModel,
SharedSpaceDecoderModel,
SharedSpaceDecoderForCausalLM,
)
# Names exposed by ``from <package> import *``; each entry is one of the
# classes imported from ``.models`` at the top of this module.
__all__ = [
    "SharedSpaceDecoderConfig",
    "SharedSpaceDecoderPreTrainedModel",
    "SharedSpaceDecoderModel",
    "SharedSpaceDecoderForCausalLM",
]

# Version string of this package.
__version__ = "0.1.0"
|