| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | from .baichuan.model import BaichuanForCausalLM |
| | from .bert.model import ( |
| | BertForQuestionAnswering, |
| | BertForSequenceClassification, |
| | BertModel, |
| | RobertaForQuestionAnswering, |
| | RobertaForSequenceClassification, |
| | RobertaModel, |
| | ) |
| | from .bloom.model import BloomForCausalLM, BloomModel |
| | from .chatglm.config import ChatGLMConfig |
| | from .chatglm.model import ChatGLMForCausalLM, ChatGLMModel |
| | from .cogvlm.config import CogVLMConfig |
| | from .cogvlm.model import CogVLMForCausalLM |
| | from .commandr.model import CohereForCausalLM |
| | from .dbrx.config import DbrxConfig |
| | from .dbrx.model import DbrxForCausalLM |
| | from .deepseek_v1.model import DeepseekForCausalLM |
| | from .deepseek_v2.model import DeepseekV2ForCausalLM |
| | from .dit.model import DiT |
| | from .eagle.model import EagleForCausalLM |
| | from .enc_dec.model import DecoderModel, EncoderModel, WhisperEncoder |
| | from .f5tts.model import F5TTS |
| | from .falcon.config import FalconConfig |
| | from .falcon.model import FalconForCausalLM, FalconModel |
| | from .gemma.config import GEMMA2_ARCHITECTURE, GEMMA_ARCHITECTURE, GemmaConfig |
| | from .gemma.model import GemmaForCausalLM |
| | from .gpt.config import GPTConfig |
| | from .gpt.model import GPTForCausalLM, GPTModel |
| | from .gptj.config import GPTJConfig |
| | from .gptj.model import GPTJForCausalLM, GPTJModel |
| | from .gptneox.model import GPTNeoXForCausalLM, GPTNeoXModel |
| | from .grok.model import GrokForCausalLM |
| | from .llama.config import LLaMAConfig |
| | from .llama.model import LLaMAForCausalLM, LLaMAModel |
| | from .mamba.model import MambaForCausalLM |
| | from .medusa.config import MedusaConfig |
| | from .medusa.model import MedusaForCausalLm |
| | from .mllama.model import MLLaMAModel |
| | from .modeling_utils import PretrainedConfig, PretrainedModel, SpeculativeDecodingMode |
| | from .mpt.model import MPTForCausalLM, MPTModel |
| | from .nemotron_nas.model import DeciLMForCausalLM |
| | from .opt.model import OPTForCausalLM, OPTModel |
| | from .phi.model import PhiForCausalLM, PhiModel |
| | from .phi3.model import Phi3ForCausalLM, Phi3Model |
| | from .qwen.model import QWenForCausalLM |
| | from .recurrentgemma.model import RecurrentGemmaForCausalLM |
| |
|
| |
|
# Public names re-exported by this package for ``from <package> import *``.
#
# Every entry must be a name that this module actually binds (see the import
# block above): a string in ``__all__`` that is not a module attribute makes
# a star-import raise ``AttributeError``. For that reason the entries
# "PhiConfig", "Phi3Config", "QWenModel", "MambaConfig" and
# "SkyworkForCausalLM" -- none of which is imported here -- are not listed,
# and the fused entry "QWenConfigQWenForCausalLM" (a lost comma between two
# names) is restored to the one name that is imported, "QWenForCausalLM".
# Re-add a config/model name only together with its import.
__all__ = [
    "BertModel",
    "BertForQuestionAnswering",
    "BertForSequenceClassification",
    "RobertaModel",
    "RobertaForQuestionAnswering",
    "RobertaForSequenceClassification",
    "BloomModel",
    "BloomForCausalLM",
    "DiT",
    "DeepseekForCausalLM",
    "DeepseekV2ForCausalLM",
    "FalconConfig",
    "FalconForCausalLM",
    "FalconModel",
    "GPTConfig",
    "GPTModel",
    "GPTForCausalLM",
    "OPTForCausalLM",
    "OPTModel",
    "LLaMAConfig",
    "LLaMAForCausalLM",
    "LLaMAModel",
    "MedusaConfig",
    "MedusaForCausalLm",
    "GPTJConfig",
    "GPTJModel",
    "GPTJForCausalLM",
    "GPTNeoXModel",
    "GPTNeoXForCausalLM",
    "PhiModel",
    "Phi3Model",
    "PhiForCausalLM",
    "Phi3ForCausalLM",
    "ChatGLMConfig",
    "ChatGLMForCausalLM",
    "ChatGLMModel",
    "BaichuanForCausalLM",
    "QWenForCausalLM",
    "EncoderModel",
    "DecoderModel",
    "PretrainedConfig",
    "PretrainedModel",
    "WhisperEncoder",
    "MambaForCausalLM",
    "MPTForCausalLM",
    "MPTModel",
    "GemmaConfig",
    "GemmaForCausalLM",
    "DbrxConfig",
    "DbrxForCausalLM",
    "RecurrentGemmaForCausalLM",
    "CogVLMConfig",
    "CogVLMForCausalLM",
    "EagleForCausalLM",
    "SpeculativeDecodingMode",
    "CohereForCausalLM",
    "MLLaMAModel",
    "F5TTS",
]
| |
|
# Lookup table from an architecture-name key to the model class registered
# for it. Several keys may share one class, so the table is written as
# ordered (class, keys) groups and flattened into a plain dict. Groups are
# listed in the order the keys must appear in the resulting dict; a class
# may therefore show up in more than one group (e.g. LLaMAForCausalLM).
# Single-key groups need the trailing comma so they stay tuples.
MODEL_MAP = {
    architecture: model_cls
    for model_cls, architectures in (
        (
            GPTForCausalLM,
            (
                "GPT2LMHeadModel",
                "GPT2LMHeadCustomModel",
                "GPTBigCodeForCausalLM",
                "Starcoder2ForCausalLM",
                "FuyuForCausalLM",
                "Kosmos2ForConditionalGeneration",
                "JAISLMHeadModel",
                "GPTForCausalLM",
                "NemotronForCausalLM",
            ),
        ),
        (OPTForCausalLM, ("OPTForCausalLM",)),
        (BloomForCausalLM, ("BloomForCausalLM",)),
        (FalconForCausalLM, ("RWForCausalLM", "FalconForCausalLM")),
        (PhiForCausalLM, ("PhiForCausalLM",)),
        (
            Phi3ForCausalLM,
            (
                "Phi3ForCausalLM",
                "Phi3VForCausalLM",
                "Phi3SmallForCausalLM",
                "PhiMoEForCausalLM",
            ),
        ),
        (MambaForCausalLM, ("MambaForCausalLM",)),
        (GPTNeoXForCausalLM, ("GPTNeoXForCausalLM",)),
        (GPTJForCausalLM, ("GPTJForCausalLM",)),
        (MPTForCausalLM, ("MPTForCausalLM",)),
        (
            ChatGLMForCausalLM,
            ("GLMModel", "ChatGLMModel", "ChatGLMForCausalLM"),
        ),
        (
            LLaMAForCausalLM,
            (
                "LlamaForCausalLM",
                "ExaoneForCausalLM",
                "MistralForCausalLM",
                "MixtralForCausalLM",
                "ArcticForCausalLM",
            ),
        ),
        (GrokForCausalLM, ("Grok1ModelForCausalLM",)),
        (LLaMAForCausalLM, ("InternLMForCausalLM", "InternLM2ForCausalLM")),
        (MedusaForCausalLm, ("MedusaForCausalLM",)),
        (BaichuanForCausalLM, ("BaichuanForCausalLM", "BaiChuanForCausalLM")),
        (LLaMAForCausalLM, ("SkyworkForCausalLM",)),
        (GemmaForCausalLM, (GEMMA_ARCHITECTURE, GEMMA2_ARCHITECTURE)),
        (
            QWenForCausalLM,
            (
                "QWenLMHeadModel",
                "QWenForCausalLM",
                "Qwen2ForCausalLM",
                "Qwen2MoeForCausalLM",
                "Qwen2ForSequenceClassification",
                "Qwen2VLForConditionalGeneration",
            ),
        ),
        (WhisperEncoder, ("WhisperEncoder",)),
        (EncoderModel, ("EncoderModel",)),
        (DecoderModel, ("DecoderModel",)),
        (DbrxForCausalLM, ("DbrxForCausalLM",)),
        (RecurrentGemmaForCausalLM, ("RecurrentGemmaForCausalLM",)),
        (CogVLMForCausalLM, ("CogVLMForCausalLM",)),
        (DiT, ("DiT",)),
        (DeepseekForCausalLM, ("DeepseekForCausalLM",)),
        (DeciLMForCausalLM, ("DeciLMForCausalLM",)),
        (DeepseekV2ForCausalLM, ("DeepseekV2ForCausalLM",)),
        (EagleForCausalLM, ("EagleForCausalLM",)),
        (CohereForCausalLM, ("CohereForCausalLM",)),
        (MLLaMAModel, ("MllamaForConditionalGeneration",)),
        (BertForQuestionAnswering, ("BertForQuestionAnswering",)),
        (BertForSequenceClassification, ("BertForSequenceClassification",)),
        (BertModel, ("BertModel",)),
        (RobertaModel, ("RobertaModel",)),
        (RobertaForQuestionAnswering, ("RobertaForQuestionAnswering",)),
        (
            RobertaForSequenceClassification,
            ("RobertaForSequenceClassification",),
        ),
        (F5TTS, ("F5TTS",)),
    )
    for architecture in architectures
}
| |
|