|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from .baichuan.model import BaichuanForCausalLM |
|
|
from .bert.model import (BertForQuestionAnswering, |
|
|
BertForSequenceClassification, BertModel) |
|
|
from .bloom.model import BloomForCausalLM, BloomModel |
|
|
from .chatglm.model import ChatGLMForCausalLM, ChatGLMModel |
|
|
from .cogvlm.config import CogVLMConfig |
|
|
from .cogvlm.model import CogVLMForCausalLM |
|
|
from .dbrx.config import DbrxConfig |
|
|
from .dbrx.model import DbrxForCausalLM |
|
|
from .dit.model import DiT |
|
|
from .enc_dec.model import DecoderModel, EncoderModel, WhisperEncoder |
|
|
from .falcon.model import FalconForCausalLM, FalconModel |
|
|
from .gemma.model import GemmaForCausalLM |
|
|
from .gpt.config import GPTConfig |
|
|
from .gpt.model import GPTForCausalLM, GPTModel |
|
|
from .gptj.model import GPTJForCausalLM, GPTJModel |
|
|
from .gptneox.model import GPTNeoXForCausalLM, GPTNeoXModel |
|
|
from .grok.model import GrokForCausalLM |
|
|
from .llama.config import LLaMAConfig |
|
|
from .llama.model import LLaMAForCausalLM, LLaMAModel |
|
|
from .mamba.model import MambaForCausalLM |
|
|
from .medusa.config import MedusaConfig |
|
|
from .medusa.model import MedusaForCausalLm |
|
|
from .modeling_utils import (PretrainedConfig, PretrainedModel, |
|
|
SpeculativeDecodingMode) |
|
|
from .mpt.model import MPTForCausalLM, MPTModel |
|
|
from .opt.model import OPTForCausalLM, OPTModel |
|
|
from .phi3.model import Phi3ForCausalLM, Phi3Model |
|
|
from .phi.model import PhiForCausalLM, PhiModel |
|
|
from .qwen.model import QWenForCausalLM |
|
|
from .recurrentgemma.model import RecurrentGemmaForCausalLM |
|
|
from .redrafter.model import ReDrafterForCausalLM |
|
|
|
|
|
__all__ = [ |
|
|
'BertModel', |
|
|
'BertForQuestionAnswering', |
|
|
'BertForSequenceClassification', |
|
|
'BloomModel', |
|
|
'BloomForCausalLM', |
|
|
'DiT', |
|
|
'FalconForCausalLM', |
|
|
'FalconModel', |
|
|
'GPTConfig', |
|
|
'GPTModel', |
|
|
'GPTForCausalLM', |
|
|
'OPTForCausalLM', |
|
|
'OPTModel', |
|
|
'LLaMAConfig', |
|
|
'LLaMAForCausalLM', |
|
|
'LLaMAModel', |
|
|
'MedusaConfig', |
|
|
'MedusaForCausalLm', |
|
|
'ReDrafterForCausalLM', |
|
|
'GPTJModel', |
|
|
'GPTJForCausalLM', |
|
|
'GPTNeoXModel', |
|
|
'GPTNeoXForCausalLM', |
|
|
'PhiModel', |
|
|
'Phi3Model', |
|
|
'PhiForCausalLM', |
|
|
'Phi3ForCausalLM', |
|
|
'ChatGLMForCausalLM', |
|
|
'ChatGLMModel', |
|
|
'BaichuanForCausalLM', |
|
|
'QWenConfig' |
|
|
'QWenForCausalLM', |
|
|
'QWenModel', |
|
|
'EncoderModel', |
|
|
'DecoderModel', |
|
|
'PretrainedConfig', |
|
|
'PretrainedModel', |
|
|
'WhisperEncoder', |
|
|
'MambaForCausalLM', |
|
|
'MPTForCausalLM', |
|
|
'MPTModel', |
|
|
'SkyworkForCausalLM', |
|
|
'GemmaForCausalLM', |
|
|
'DbrxConfig', |
|
|
'DbrxForCausalLM', |
|
|
'RecurrentGemmaForCausalLM', |
|
|
'CogVLMConfig', |
|
|
'CogVLMForCausalLM', |
|
|
'SpeculativeDecodingMode', |
|
|
] |
|
|
|
|
|
MODEL_MAP = { |
|
|
'GPT2LMHeadModel': GPTForCausalLM, |
|
|
'GPT2LMHeadCustomModel': GPTForCausalLM, |
|
|
'GPTBigCodeForCausalLM': GPTForCausalLM, |
|
|
'Starcoder2ForCausalLM': GPTForCausalLM, |
|
|
'FuyuForCausalLM': GPTForCausalLM, |
|
|
'Kosmos2ForConditionalGeneration': GPTForCausalLM, |
|
|
'JAISLMHeadModel': GPTForCausalLM, |
|
|
'GPTForCausalLM': GPTForCausalLM, |
|
|
'OPTForCausalLM': OPTForCausalLM, |
|
|
'BloomForCausalLM': BloomForCausalLM, |
|
|
'RWForCausalLM': FalconForCausalLM, |
|
|
'FalconForCausalLM': FalconForCausalLM, |
|
|
'PhiForCausalLM': PhiForCausalLM, |
|
|
'Phi3ForCausalLM': Phi3ForCausalLM, |
|
|
'Phi3SmallForCausalLM': Phi3ForCausalLM, |
|
|
'MambaForCausalLM': MambaForCausalLM, |
|
|
'GPTNeoXForCausalLM': GPTNeoXForCausalLM, |
|
|
'GPTJForCausalLM': GPTJForCausalLM, |
|
|
'MPTForCausalLM': MPTForCausalLM, |
|
|
'GLMModel': ChatGLMForCausalLM, |
|
|
'ChatGLMModel': ChatGLMForCausalLM, |
|
|
'ChatGLMForCausalLM': ChatGLMForCausalLM, |
|
|
'LlamaForCausalLM': LLaMAForCausalLM, |
|
|
'MistralForCausalLM': LLaMAForCausalLM, |
|
|
'MixtralForCausalLM': LLaMAForCausalLM, |
|
|
'ArcticForCausalLM': LLaMAForCausalLM, |
|
|
'Grok1ModelForCausalLM': GrokForCausalLM, |
|
|
'InternLMForCausalLM': LLaMAForCausalLM, |
|
|
'InternLM2ForCausalLM': LLaMAForCausalLM, |
|
|
'MedusaForCausalLM': MedusaForCausalLm, |
|
|
'ReDrafterForCausalLM': ReDrafterForCausalLM, |
|
|
'BaichuanForCausalLM': BaichuanForCausalLM, |
|
|
'BaiChuanForCausalLM': BaichuanForCausalLM, |
|
|
'SkyworkForCausalLM': LLaMAForCausalLM, |
|
|
'GemmaForCausalLM': GemmaForCausalLM, |
|
|
'QWenLMHeadModel': QWenForCausalLM, |
|
|
'QWenForCausalLM': QWenForCausalLM, |
|
|
'Qwen2ForCausalLM': QWenForCausalLM, |
|
|
'Qwen2MoeForCausalLM': QWenForCausalLM, |
|
|
'WhisperEncoder': WhisperEncoder, |
|
|
'EncoderModel': EncoderModel, |
|
|
'DecoderModel': DecoderModel, |
|
|
'DbrxForCausalLM': DbrxForCausalLM, |
|
|
'RecurrentGemmaForCausalLM': RecurrentGemmaForCausalLM, |
|
|
'CogVLMForCausalLM': CogVLMForCausalLM, |
|
|
'DiT': DiT, |
|
|
} |
|
|
|