File size: 555 Bytes
cd2099c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# -*- coding: utf-8 -*-

"""
Subspace Decoder Layers

This module contains the layer implementations for the Shared Subspace Decoder,
including Multi-Head Latent Attention (MLA) and decomposed MLP layers. It also
re-exports the SharedSpaceDecoderForCausalLM task head.
"""

# Import the main layer classes
from .mla import MultiheadLatentAttention, RotaryEmbedding
from .feedforward import SubspaceFeedForward
from .task_heads import SharedSpaceDecoderForCausalLM

# Names exposed by a star-import of this package, grouped by the
# submodule each one is imported from.
__all__ = [
    # .mla
    "MultiheadLatentAttention",
    "RotaryEmbedding",
    # .feedforward
    "SubspaceFeedForward",
    # .task_heads
    "SharedSpaceDecoderForCausalLM",
]