| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| from .baichuan.model import BaichuanForCausalLM |
| from .bert.model import ( |
| BertForQuestionAnswering, |
| BertForSequenceClassification, |
| BertModel, |
| RobertaForQuestionAnswering, |
| RobertaForSequenceClassification, |
| RobertaModel, |
| ) |
| from .bloom.model import BloomForCausalLM, BloomModel |
| from .chatglm.config import ChatGLMConfig |
| from .chatglm.model import ChatGLMForCausalLM, ChatGLMModel |
| from .cogvlm.config import CogVLMConfig |
| from .cogvlm.model import CogVLMForCausalLM |
| from .commandr.model import CohereForCausalLM |
| from .dbrx.config import DbrxConfig |
| from .dbrx.model import DbrxForCausalLM |
| from .deepseek_v1.model import DeepseekForCausalLM |
| from .deepseek_v2.model import DeepseekV2ForCausalLM |
| from .dit.model import DiT |
| from .eagle.model import EagleForCausalLM |
| from .enc_dec.model import DecoderModel, EncoderModel, WhisperEncoder |
| from .f5tts.model import F5TTS |
| from .falcon.config import FalconConfig |
| from .falcon.model import FalconForCausalLM, FalconModel |
| from .gemma.config import GEMMA2_ARCHITECTURE, GEMMA_ARCHITECTURE, GemmaConfig |
| from .gemma.model import GemmaForCausalLM |
| from .gpt.config import GPTConfig |
| from .gpt.model import GPTForCausalLM, GPTModel |
| from .gptj.config import GPTJConfig |
| from .gptj.model import GPTJForCausalLM, GPTJModel |
| from .gptneox.model import GPTNeoXForCausalLM, GPTNeoXModel |
| from .grok.model import GrokForCausalLM |
| from .llama.config import LLaMAConfig |
| from .llama.model import LLaMAForCausalLM, LLaMAModel |
| from .mamba.model import MambaForCausalLM |
| from .medusa.config import MedusaConfig |
| from .medusa.model import MedusaForCausalLm |
| from .mllama.model import MLLaMAModel |
| from .modeling_utils import PretrainedConfig, PretrainedModel, SpeculativeDecodingMode |
| from .mpt.model import MPTForCausalLM, MPTModel |
| from .nemotron_nas.model import DeciLMForCausalLM |
| from .opt.model import OPTForCausalLM, OPTModel |
| from .phi.model import PhiForCausalLM, PhiModel |
| from .phi3.model import Phi3ForCausalLM, Phi3Model |
| from .qwen.model import QWenForCausalLM |
| from .recurrentgemma.model import RecurrentGemmaForCausalLM |
|
|
|
|
# Names exported by a star-import of this package.
#
# Every entry has to be bound by one of the imports at the top of this module:
# a name that is listed here but never imported makes ``from <package> import *``
# raise AttributeError.  For that reason "PhiConfig", "Phi3Config",
# "QWenConfig", "QWenModel", "MambaConfig" and "SkyworkForCausalLM" are not
# listed -- this module does not import them.  Re-add any of them only together
# with the corresponding import.
#
# Entries are grouped by the sub-module they are imported from.
__all__ = [
    # modeling_utils
    "PretrainedConfig",
    "PretrainedModel",
    "SpeculativeDecodingMode",
    # baichuan
    "BaichuanForCausalLM",
    # bert
    "BertModel",
    "BertForQuestionAnswering",
    "BertForSequenceClassification",
    "RobertaModel",
    "RobertaForQuestionAnswering",
    "RobertaForSequenceClassification",
    # bloom
    "BloomModel",
    "BloomForCausalLM",
    # chatglm
    "ChatGLMConfig",
    "ChatGLMForCausalLM",
    "ChatGLMModel",
    # cogvlm
    "CogVLMConfig",
    "CogVLMForCausalLM",
    # commandr
    "CohereForCausalLM",
    # dbrx
    "DbrxConfig",
    "DbrxForCausalLM",
    # deepseek_v1 / deepseek_v2
    "DeepseekForCausalLM",
    "DeepseekV2ForCausalLM",
    # dit
    "DiT",
    # eagle
    "EagleForCausalLM",
    # enc_dec
    "EncoderModel",
    "DecoderModel",
    "WhisperEncoder",
    # f5tts
    "F5TTS",
    # falcon
    "FalconConfig",
    "FalconForCausalLM",
    "FalconModel",
    # gemma
    "GemmaConfig",
    "GemmaForCausalLM",
    # gpt
    "GPTConfig",
    "GPTModel",
    "GPTForCausalLM",
    # gptj
    "GPTJConfig",
    "GPTJModel",
    "GPTJForCausalLM",
    # gptneox
    "GPTNeoXModel",
    "GPTNeoXForCausalLM",
    # llama
    "LLaMAConfig",
    "LLaMAForCausalLM",
    "LLaMAModel",
    # mamba
    "MambaForCausalLM",
    # medusa (the class name really ends in a lowercase "m")
    "MedusaConfig",
    "MedusaForCausalLm",
    # mllama
    "MLLaMAModel",
    # mpt
    "MPTForCausalLM",
    "MPTModel",
    # opt
    "OPTForCausalLM",
    "OPTModel",
    # phi / phi3
    "PhiModel",
    "PhiForCausalLM",
    "Phi3Model",
    "Phi3ForCausalLM",
    # qwen -- must be its own entry; fusing it with a neighbouring string
    # (missing comma) silently drops the class from the export list.
    "QWenForCausalLM",
    # recurrentgemma
    "RecurrentGemmaForCausalLM",
]
|
|
# Registry mapping an architecture-name key to the model class that handles it.
#
# The table below is an ordered sequence of (model class, keys) pairs; the
# comprehension flattens it into a plain dict.  Several keys may share one
# class, and the same class may appear in more than one row -- rows are kept
# in this exact sequence so the resulting dict has a stable insertion order.
# NOTE(review): presumably the keys are the architecture strings found in
# checkpoint configs -- confirm against the callers that read MODEL_MAP.
MODEL_MAP = {
    arch_name: model_cls
    for model_cls, arch_names in (
        (
            GPTForCausalLM,
            (
                "GPT2LMHeadModel",
                "GPT2LMHeadCustomModel",
                "GPTBigCodeForCausalLM",
                "Starcoder2ForCausalLM",
                "FuyuForCausalLM",
                "Kosmos2ForConditionalGeneration",
                "JAISLMHeadModel",
                "GPTForCausalLM",
                "NemotronForCausalLM",
            ),
        ),
        (OPTForCausalLM, ("OPTForCausalLM",)),
        (BloomForCausalLM, ("BloomForCausalLM",)),
        (FalconForCausalLM, ("RWForCausalLM", "FalconForCausalLM")),
        (PhiForCausalLM, ("PhiForCausalLM",)),
        (
            Phi3ForCausalLM,
            (
                "Phi3ForCausalLM",
                "Phi3VForCausalLM",
                "Phi3SmallForCausalLM",
                "PhiMoEForCausalLM",
            ),
        ),
        (MambaForCausalLM, ("MambaForCausalLM",)),
        (GPTNeoXForCausalLM, ("GPTNeoXForCausalLM",)),
        (GPTJForCausalLM, ("GPTJForCausalLM",)),
        (MPTForCausalLM, ("MPTForCausalLM",)),
        (ChatGLMForCausalLM, ("GLMModel", "ChatGLMModel", "ChatGLMForCausalLM")),
        (
            LLaMAForCausalLM,
            (
                "LlamaForCausalLM",
                "ExaoneForCausalLM",
                "MistralForCausalLM",
                "MixtralForCausalLM",
                "ArcticForCausalLM",
            ),
        ),
        (GrokForCausalLM, ("Grok1ModelForCausalLM",)),
        (LLaMAForCausalLM, ("InternLMForCausalLM", "InternLM2ForCausalLM")),
        (MedusaForCausalLm, ("MedusaForCausalLM",)),
        (BaichuanForCausalLM, ("BaichuanForCausalLM", "BaiChuanForCausalLM")),
        (LLaMAForCausalLM, ("SkyworkForCausalLM",)),
        # The Gemma keys come from constants defined in the gemma config module.
        (GemmaForCausalLM, (GEMMA_ARCHITECTURE, GEMMA2_ARCHITECTURE)),
        (
            QWenForCausalLM,
            (
                "QWenLMHeadModel",
                "QWenForCausalLM",
                "Qwen2ForCausalLM",
                "Qwen2MoeForCausalLM",
                "Qwen2ForSequenceClassification",
                "Qwen2VLForConditionalGeneration",
            ),
        ),
        (WhisperEncoder, ("WhisperEncoder",)),
        (EncoderModel, ("EncoderModel",)),
        (DecoderModel, ("DecoderModel",)),
        (DbrxForCausalLM, ("DbrxForCausalLM",)),
        (RecurrentGemmaForCausalLM, ("RecurrentGemmaForCausalLM",)),
        (CogVLMForCausalLM, ("CogVLMForCausalLM",)),
        (DiT, ("DiT",)),
        (DeepseekForCausalLM, ("DeepseekForCausalLM",)),
        (DeciLMForCausalLM, ("DeciLMForCausalLM",)),
        (DeepseekV2ForCausalLM, ("DeepseekV2ForCausalLM",)),
        (EagleForCausalLM, ("EagleForCausalLM",)),
        (CohereForCausalLM, ("CohereForCausalLM",)),
        (MLLaMAModel, ("MllamaForConditionalGeneration",)),
        (BertForQuestionAnswering, ("BertForQuestionAnswering",)),
        (BertForSequenceClassification, ("BertForSequenceClassification",)),
        (BertModel, ("BertModel",)),
        (RobertaModel, ("RobertaModel",)),
        (RobertaForQuestionAnswering, ("RobertaForQuestionAnswering",)),
        (RobertaForSequenceClassification, ("RobertaForSequenceClassification",)),
        (F5TTS, ("F5TTS",)),
    )
    for arch_name in arch_names
}
|
|