# llama3_baseline_dev / __init__.py
# smithblack-0's picture
# Update architecture and tokenizer
# 98abb50 verified
# Raw
# History Blame Contribute Delete
# 397 Bytes
from .attention import GroupedQueryAttention
from .configuration import Llama3Config
from .decoder_layer import DecoderLayer
from .huggingface import Llama3ForCausalLM
from .mlp import SwiGLUMLP
from .model import Llama3Model
from .rope import RotaryEmbedding
# Public API of this package: exactly the names pulled in by the relative
# imports above, listed alphabetically. This list controls what
# ``from <package> import *`` exposes.
__all__ = [
    "DecoderLayer",
    "GroupedQueryAttention",
    "Llama3Config",
    "Llama3ForCausalLM",
    "Llama3Model",
    "RotaryEmbedding",
    "SwiGLUMLP",
]