optimum/habana/transformers/models/__init__.py (352 lines of code) (raw):

from .albert import gaudi_albert_forward from .baichuan import ( BaichuanConfig, BaichuanForCausalLM, BaichuanTokenizer, ) from .bart import ( gaudi_BartAttention_forward, gaudi_BartDecoder_forward, gaudi_BartDecoderLayer_forward, gaudi_BartEncoder_forward, gaudi_BartEncoderLayer_forward, gaudi_BartForConditionalGeneration_forward, gaudi_BartForConditionalGeneration_prepare_inputs_for_generation, gaudi_BartLearnedPositionalEmbedding, gaudi_BartModel_forward, ) from .bert import gaudi_BertModel_forward from .blip import ( gaudi_BlipForConditionalGeneration_generate, gaudi_BlipForQuestionAnswering_generate, gaudi_BlipTextAttention_forward, gaudi_BlipTextEncoder_forward, gaudi_BlipTextLayer_forward, gaudi_BlipTextLMHead_forward, gaudi_BlipTextLMHead_prepare_inputs_for_generation, gaudi_BlipTextModel_forward, gaudi_BlipTextSelfAttention_forward, ) from .bloom import ( GaudiBloomForCausalLM, GaudiBloomMLP, gaudi_bloom_attention_forward, gaudi_bloom_block_forward, gaudi_bloom_convert_to_bloom_cache, gaudi_bloom_convert_to_standard_cache, gaudi_bloom_model_forward, ) from .chatglm import ( ChatGLMConfig, ChatGLMForConditionalGeneration, ChatGLMForSequenceClassification, ChatGLMTokenizer, ) from .clip import ( GaudiCLIPAttention, GaudiCLIPEncoder, GaudiCLIPEncoderLayer, GaudiCLIPVisionEmbeddings, GaudiCLIPVisionModel, GaudiCLIPVisionTransformer, ) from .codegen import ( GaudiCodeGenAttention, GaudiCodeGenForCausalLM, gaudi_codegen_block_forward, gaudi_codegen_model_forward, ) from .cohere import ( GaudiCohereAttention, GaudiCohereDecoderLayer, GaudiCohereForCausalLM, gaudi_cohere_model_forward, ) from .decilm import ( DeciLMConfig, DeciLMForCausalLM, ) from .deepseek_v2 import ( DeepseekTokenizerFast, DeepseekV2Config, DeepseekV2ForCausalLM, ) from .deepseek_v3 import ( DeepseekV3Config, DeepseekV3ForCausalLM, ) from .detr import ( gaudi_DetrConvModel_forward, gaudi_DetrHungarianMatcher_forward, gaudi_DetrLoss_forward, gaudi_DetrLoss_loss_boxes, gaudi_DetrLoss_loss_cardinality, gaudi_DetrLoss_loss_labels, ) from .esm import ( gaudi_esm_for_protein_folding_forward, gaudi_esmfolding_trunk_forward, gaudi_rot_matmul, gaudi_rot_vec_mul, ) from .falcon import ( GaudiFalconAttention, GaudiFalconDecoderLayer, GaudiFalconForCausalLM, GaudiFalconMLP, GaudiFalconModel, gaudi_falcon_linear_forward, ) from .falcon_mamba import ( gaudi_FalconMambaForCausalLM_prepare_inputs_for_generation, gaudi_FalconMambaModel_forward, ) from .gemma import ( GaudiGemmaAttention, GaudiGemmaDecoderLayer, GaudiGemmaForCausalLM, GaudiGemmaMLP, GaudiGemmaModel, ) from .gemma2 import ( GaudiGemma2Attention, GaudiGemma2DecoderLayer, GaudiGemma2ForCausalLM, GaudiGemma2MLP, GaudiGemma2Model, GaudiGemma2RotaryEmbedding, ) from .glm4v import ( ChatGLM4Tokenizer, GLM4VConfig, GLM4VForConditionalGeneration, GLM4VForSequenceClassification, ) from .gpt2 import ( GaudiGPT2Attention, GaudiGPT2Block, GaudiGPT2DoubleHeadsModel, GaudiGPT2LMHeadModel, gaudi_gpt2_forward, ) from .gpt_bigcode import ( GaudiGPTBigCodeAttention, GaudiGPTBigCodeForCausalLM, gaudi_gpt_bigcode_block_forward, gaudi_gpt_bigcode_model_forward, ) from .gpt_neo import ( GaudiGPTNeoForCausalLM, gaudi_gpt_neo_attention_forward, gaudi_gpt_neo_block_forward, gaudi_gpt_neo_model_forward, gaudi_gpt_neo_selfattention_forward, ) from .gpt_neox import ( GaudiGPTNeoXAttention, GaudiGPTNeoXForCausalLM, GaudiGPTNeoXLayer, gaudi_gpt_neox_model_forward, ) from .gptj import ( GaudiGPTJAttention, GaudiGPTJBlock, GaudiGPTJForCausalLM, GaudiGPTJModel, ) from .idefics2 import ( Gaudi2Idefics2ImageProcessor, GaudiIdefics2ForConditionalGeneration, GaudiIdefics2Model, GaudiIdefics2VisionEmbeddings, ) from .llama import ( GaudiLlamaAttention, GaudiLlamaDecoderLayer, GaudiLlamaForCausalLM, GaudiLlamaMLP, GaudiLlamaModel, GaudiLlamaRotaryEmbedding, LlamaConfig, gaudi_llama_rmsnorm_forward, ) from .llava import GaudiLlavaForConditionalGeneration from .llava_next import GaudiLlavaNextForConditionalGeneration from .llava_onevision import GaudiLlavaOnevisionForConditionalGeneration from .mamba import ( gaudi_MambaForCausalLM_prepare_inputs_for_generation, gaudi_MambaForCausalLM_update_model_kwargs_for_generation, ) from .minicpm import MiniCPM3Config, MiniCPM3ForCausalLM from .mistral import ( GaudiMistralAttention, GaudiMistralDecoderLayer, GaudiMistralForCausalLM, GaudiMistralModel, MistralConfig, gaudi_mistral_rmsnorm_forward, ) from .mixtral import ( GaudiMixtralAttention, GaudiMixtralDecoderLayer, GaudiMixtralForCausalLM, GaudiMixtralModel, GaudiMixtralSparseMoeBlock, MixtralConfig, gaudi_mixtral_rmsnorm_forward, ) from .mllama import ( GaudiMllamaCrossAttentionDecoderLayer, GaudiMllamaForCausalLM, GaudiMllamaForConditionalGeneration, GaudiMllamaSelfAttentionDecoderLayer, GaudiMllamaTextCrossAttention, GaudiMllamaTextModel, GaudiMllamaTextSelfAttention, GaudiMllamaVisionEncoder, GaudiMllamaVisionEncoderLayer, GaudiMllamaVisionModel, GaudiMllamaVisionSdpaAttention, ) from .modeling_all_models import ( KVCache, Matmul, apply_customized_rope_module, gaudi_check_and_enable_sdpa, gaudi_conv1d_forward, gaudi_get_extended_attention_mask, gaudi_invert_attention_mask, ) from .mpt import ( GaudiMptAttention, GaudiMptBlock, GaudiMptForCausalLM, GaudiMptModel, ) from .opt import ( GaudiOPTDecoderLayer, GaudiOPTForCausalLM, GaudiOPTLearnedPositionalEmbedding, gaudi_opt_attention_forward, gaudi_opt_decoder_forward, gaudi_opt_model_forward, ) from .owlvit import gaudi_owlvitclasspredictionhead_forward from .paligemma import GaudiPaliGemmaForConditionalGeneration from .persimmon import ( GaudiPersimmonAttention, GaudiPersimmonDecoderLayer, GaudiPersimmonForCausalLM, gaudi_persimmon_model_forward, ) from .phi import ( GaudiPhiAttention, GaudiPhiDecoderLayer, GaudiPhiForCausalLM, GaudiPhiModel, ) from .qwen2 import ( GaudiQwen2Attention, GaudiQwen2DecoderLayer, GaudiQwen2ForCausalLM, GaudiQwen2MLP, GaudiQwen2Model, gaudi_qwen2_rmsnorm_forward, ) from .qwen2_moe import ( GaudiQwen2MoeAttention, GaudiQwen2MoeDecoderLayer, GaudiQwen2MoeForCausalLM, GaudiQwen2MoeMLP, GaudiQwen2MoeModel, gaudi_qwen2moe_block_sparse_moe_forward, gaudi_qwen2moe_rmsnorm_forward, ) from .qwen2_vl import ( GaudiQwen2VisionTransformerPretrainedModel, GaudiQwen2VLDecoderLayer, GaudiQwen2VLForConditionalGeneration, GaudiQwen2VLModel, GaudiQwen2VLSdpaAttention, GaudiQwen2VLVisionBlock, GaudiVisionSdpaAttention, ) from .seamless_m4t import ( gaudi_SeamlessM4TAttention_forward, gaudi_SeamlessM4TCodeHifiGan_get_output_hifigan_lengths, gaudi_SeamlessM4TDecoder_forward, gaudi_SeamlessM4TDecoderLayer_forward, gaudi_SeamlessM4TForTextToSpeech_forward, gaudi_SeamlessM4TForTextToSpeech_generate, gaudi_SeamlessM4TForTextToSpeech_prepare_inputs_for_generation, gaudi_SeamlessM4TTextToUnitForConditionalGeneration_forward, gaudi_SeamlessM4TTextToUnitForConditionalGeneration_prepare_inputs_for_generation, gaudi_SeamlessM4TTextToUnitModel_forward, ) from .siglip import ( GaudiSiglipAttention, GaudiSiglipEncoder, GaudiSiglipEncoderLayer, GaudiSiglipVisionEmbeddings, GaudiSiglipVisionModel, GaudiSiglipVisionTransformer, ) from .speecht5 import ( gaudi_generate_speech, gaudi_SpeechT5Attention_forward, gaudi_SpeechT5Decoder_forward, gaudi_SpeechT5DecoderLayer_forward, ) from .stablelm import ( GaudiStableLmAttention, GaudiStableLmDecoderLayer, GaudiStableLmForCausalLM, gaudi_stablelm_model_forward, ) from .starcoder2 import ( GaudiStarcoder2Attention, GaudiStarcoder2DecoderLayer, GaudiStarcoder2ForCausalLM, GaudiStarcoder2Model, ) from .t5 import ( gaudi_t5_layernorm_forward, gaudi_T5Attention_forward, gaudi_T5Block_forward, gaudi_T5ForConditionalGeneration_forward, gaudi_T5ForConditionalGeneration_prepare_inputs_for_generation, gaudi_T5LayerSelfAttention_forward, gaudi_T5Stack_forward, ) from .table_transformer import gaudi_table_transformer_conv_encoder_forward from .video_llava import GaudiVideoLlavaForConditionalGeneration, GaudiVideoLlavaProcessor from .vision_encoder_decoder import ( gaudi_VisionEncoderDecoderModel_prepare_inputs_for_generation, ) from .vit import gaudi_vit_self_attention_forward from .vits import gaudi_unconstrained_rational_quadratic_spline from .wav2vec2 import ( GaudiWav2Vec2SdpaAttention, _gaudi_wav2vec2_compute_mask_indices, _gaudi_wav2vec2_mask_hidden_states, _gaudi_wav2vec2_sample_negative_indices, gaudi_wav2vec2_encoder_forward, gaudi_wav2vec2_forward, gaudi_wav2vec2_tdnnlayer_forward, gaudi_wav2vec2forctc_forward, ) from .whisper import ( GAUDI_WHISPER_ATTENTION_CLASSES, GaudiWhisperDecoder, GaudiWhisperDecoderLayer, GaudiWhisperForConditionalGeneration, GaudiWhisperModel, GaudiWhisperSdpaAttention, ) from .xglm import ( GaudiXGLMForCausalLM, gaudi_xglm_attention_forward, gaudi_xglm_decoder_layer_forward, gaudi_xglm_model_forward, ) from .xlm_roberta import gaudi_XLMRoberta_Sdpa_SelfAttention_forward