llama3_baseline / __init__.py
smithblack-0's picture
Update architecture and tokenizer
b7858ac verified
raw
history blame contribute delete
397 Bytes
from .attention import GroupedQueryAttention
from .configuration import Llama3Config
from .decoder_layer import DecoderLayer
from .huggingface import Llama3ForCausalLM
from .mlp import SwiGLUMLP
from .model import Llama3Model
from .rope import RotaryEmbedding
# Names exported by a star-import of this package; each entry corresponds
# to one of the relative imports above.
__all__ = [
    "DecoderLayer",
    "GroupedQueryAttention",
    "Llama3Config",
    "Llama3ForCausalLM",
    "Llama3Model",
    "RotaryEmbedding",
    "SwiGLUMLP",
]