o
    ZhkQ                    @   sT  d Z ddlZddlmZ ddlmZ ddlmZmZm	Z	m
Z
 ddlmZ eeZeg d	Zeg d
Zeg dZeg dZeg dZeg dZedgZeg dZedgZeg dZedgZeg dZeg dZeg dZedgZeg dZeg dZ eg dZ!eg dZ"eg dZ#eg dZ$eg dZ%eg dZ&eg d Z'ed!gZ(eg d"Z)eg d#Z*eg d$Z+eg d%Z,eg d&Z-eg d'Z.eg d(Z/eg d)Z0eg d*Z1ed+d,gZ2eg d-Z3eg d.Z4eg d/Z5ed0gZ6ed1gZ6ed2gZ7eg d3Z8ed4d5gZ9ed6d7gZ:ed8gZ;ed9gZ<e	eeZ=e	eeZ>e	eeZ?e	eeZ@e	eeZAe	eeZBe	ee4ZCe	eeZDe	eeZEe	eeZFe	eeZGe	eeZHe	eeZIe	eeZJe	eeZKe	ee)ZLe	ee*ZMe	ee ZNe	eeZOe	eeZPe	ee!ZQe	ee"ZRe	ee#ZSe	ee$ZTe	ee&ZUe	ee'ZVe	ee(ZWe	ee+ZXe	ee,ZYe	ee-ZZe	ee.Z[e	ee/Z\e	ee%Z]e	ee0Z^e	ee1Z_e	ee2Z`e	ee3Zae	ee5Zbe	ee6Zce	ee7Zde	ee8Zee	ee9Zfe	ee:Zge	ee;Zhe	ee<ZiG d:d; d;eZjG d<d= d=eZkG d>d? d?eZlG d@dA dAeZmG dBdC dCeZne
enZnG dDdE dEeZoe
eodFdGZoG dHdI dIeZpe
epdJdGZpG dKdL dLeZqe
eqdMdGZqG dNdO dOeZre
erdPdGZrG dQdR dReZse
esdSdTdUZsG dVdW dWeZte
etdXdGZtG dYdZ dZeZue
eud[dGZuG d\d] d]eZve
evd^d_dUZvG d`da daeZwe
ewdbdcdUZwG ddde deeZxe
exdfdgdUZxG dhdi dieZye
eydjdGZyG dkdl dleZze
ezdmdGZzG dndo doeZ{e
e{dpdGZ{G dqdr dreZ|e
e|dsdGZ|G dtdu dueZ}e
e}dvdGZ}G dwdx dxeZ~e
e~dydGZ~G dzd{ d{eZe
ed|dGZG d}d~ d~eZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZe
eddGZG dd deZG dd deZG dd deZG dd deZe
eddGZG dd deZe
eddGZG dd depZg dZdS )zAuto Model class.    N)OrderedDict   )logging   )_BaseAutoBackboneClass_BaseAutoModelClass_LazyAutoMappingauto_class_update)CONFIG_MAPPING_NAMES(?  albertZAlbertModelalignZ
AlignModelZaltclipZAltCLIPModel)ariaZ	AriaModel)	aria_textZAriaTextModel)audio-spectrogram-transformerZASTModel)Z
autoformerZAutoformerModel)
aya_visionZAyaVisionModel)bambaZ
BambaModelZbarkZ	BarkModel)bartZ	BartModelbeitZ	BeitModelbertZ	BertModel)bert-generationZBertGenerationEncoderbig_birdZBigBirdModel)bigbird_pegasusZBigBirdPegasusModel)biogptZBioGptModelbitZBitModel)bitnetZBitNetModel)
blenderbotZBlenderbotModel)blenderbot-smallZBlenderbotSmallModelblipZ	BlipModel)blip-2Z
Blip2Model)Zblip_2_qformerZBlip2QFormerModel)bloomZ
BloomModel)ZbridgetowerZBridgeTowerModel)brosZ	BrosModel)	camembertZCamembertModel)canineZCanineModel)	chameleonZChameleonModelZchinese_clipZChineseCLIPModel)Zchinese_clip_vision_modelZChineseCLIPVisionModel)clapZ	ClapModelclipZ	CLIPModelZclip_text_modelZCLIPTextModel)Zclip_vision_modelZCLIPVisionModelZclipsegZCLIPSegModel)ZclvpZ!ClvpModelForConditionalGeneration)
code_llama
LlamaModel)codegenZCodeGenModel)cohereZCohereModel)cohere2ZCohere2Modelconditional_detrZConditionalDetrModel)convbertZConvBertModelconvnextZConvNextModel
convnextv2ZConvNextV2Model)cpmantZCpmAntModelZcsmZCsmForConditionalGeneration)ctrlZ	CTRLModel)cvtZCvtModel)d_fineZ
DFineModeldab-detrZDabDetrModel)ZdacZDacModel)data2vec-audioZData2VecAudioModeldata2vec-textZData2VecTextModeldata2vec-visionZData2VecVisionModel)dbrxZ	DbrxModeldebertaZDebertaModel
deberta-v2ZDebertaV2Model)Zdecision_transformerZDecisionTransformerModel)deepseek_v3ZDeepseekV3Modeldeformable_detrZDeformableDetrModeldeitZ	DeiTModel	depth_proZDepthProModeldetaZ	DetaModeldetrZ	DetrModel)	diffllamaZDiffLlamaModeldinatZ
DinatModeldinov2ZDinov2Modeldinov2_with_registersZDinov2WithRegistersModel
distilbertZDistilBertModel)
donut-swinZDonutSwinModel)ZdprZDPRQuestionEncoderdptZDPTModelefficientformerZEfficientFormerModelefficientnetZEfficientNetModelelectraZElectraModel)emu3Z	Emu3Model)ZencodecZEncodecModel)ernieZ
ErnieModel)ernie_mZErnieMModel)esmZEsmModel)falconZFalconModel)falcon_mambaZFalconMambaModelfastspeech2_conformerZFastSpeech2ConformerModelflaubertZFlaubertModel)flavaZ
FlavaModel)fnetZ	FNetModelfocalnetZFocalNetModel)fsmtZ	FSMTModel)funnel)ZFunnelModelZFunnelBaseModel)fuyuZ	FuyuModel)gemmaZ
GemmaModel)gemma2ZGemma2Model)gemma3ZGemma3Model)gemma3_textZGemma3TextModel)gitZGitModel)glmZGlmModel)glm4Z	Glm4ModelglpnZ	GLPNModel)got_ocr2ZGotOcr2Model)gpt-sw3	GPT2Model)gpt2r   )gpt_bigcodeZGPTBigCodeModel)gpt_neoZGPTNeoModel)gpt_neoxZGPTNeoXModel)gpt_neox_japaneseZGPTNeoXJapaneseModel)gptjZ	GPTJModelzgptsan-japaneseZ&GPTSanJapaneseForConditionalGeneration)graniteZGraniteModel)
granitemoeZGraniteMoeModel)granitemoehybridZGraniteMoeHybridModel)granitemoesharedZGraniteMoeSharedModel)Z
graphormerZGraphormerModel)grounding-dinoZGroundingDinoModel)ZgroupvitZGroupViTModel)heliumZHeliumModelhgnet_v2ZHGNetV2BackbonehieraZ
HieraModel)hubertZHubertModelibertZ
IBertModel)ideficsZIdeficsModel)idefics2ZIdefics2Model)idefics3ZIdefics3Model)Zidefics3_visionZIdefics3VisionTransformerijepaZ
IJepaModelimagegptZImageGPTModel)ZinformerZInformerModel)instructblipZInstructBlipModel)instructblipvideoZInstructBlipVideoModel)internvlZInternVLModel)Zinternvl_visionZInternVLVisionModel)jambaZ
JambaModel)janusZ
JanusModel)jetmoeZJetMoeModel)ZjukeboxZJukeboxModel)kosmos-2ZKosmos2Model)layoutlmZLayoutLMModel)
layoutlmv2ZLayoutLMv2Model)
layoutlmv3ZLayoutLMv3Model)ledZLEDModellevitZ
LevitModel)liltZ	LiltModel)llamar4   llama4ZLlama4ForConditionalGeneration)llama4_textLlama4TextModel)llavaZ
LlavaModel)
llava_nextZLlavaNextModel)llava_next_videoZLlavaNextVideoModel)llava_onevisionZLlavaOnevisionModel
longformerZLongformerModel)longt5ZLongT5Model)lukeZ	LukeModel)lxmertZLxmertModel)m2m_100ZM2M100Model)mambaZ
MambaModel)mamba2ZMamba2Model)marianZMarianModel)markuplmZMarkupLMModel)mask2formerZMask2FormerModel)
maskformerZMaskFormerModel)maskformer-swinZMaskFormerSwinModel)mbartZ
MBartModel)mctctZ
MCTCTModel)megaZ	MegaModel)megatron-bertZMegatronBertModel)zmgp-strZMgpstrForSceneTextRecognition)ZmimiZ	MimiModel)mistralZMistralModel)mistral3ZMistral3Model)mixtralZMixtralModelZmlcdZMLCDVisionModel)mllamaZMllamaModel
mobilebertZMobileBertModelmobilenet_v1ZMobileNetV1Modelmobilenet_v2ZMobileNetV2Model	mobilevitZMobileViTModelmobilevitv2ZMobileViTV2Model)
modernbertZModernBertModel)	moonshineZMoonshineModel)moshiZ
MoshiModel)mpnetZ
MPNetModel)mptZMptModel)mraZMraModel)mt5ZMT5Model)musicgenZMusicgenModel)musicgen_melodyZMusicgenMelodyModel)mvpZMvpModelnatZNatModel)nemotronZNemotronModel)nezhaZ
NezhaModel)nllb-moeZNllbMoeModelnystromformerZNystromformerModel)olmoZ	OlmoModel)olmo2Z
Olmo2Model)olmoeZ
OlmoeModelzomdet-turboZOmDetTurboForObjectDetection)	oneformerZOneFormerModel)
open-llamaZOpenLlamaModel)
openai-gptZOpenAIGPTModel)optZOPTModel)owlv2Z
Owlv2Model)owlvitZOwlViTModel)	paligemmaZPaliGemmaModel)patchtsmixerZPatchTSMixerModel)patchtstZPatchTSTModel)pegasusZPegasusModel)	pegasus_xZPegasusXModel)	perceiverZPerceiverModel)	persimmonZPersimmonModel)phiZPhiModel)phi3Z	Phi3Model)phi4_multimodalZPhi4MultimodalModel)phimoeZPhimoeModel)pixtralZPixtralVisionModel)plbartZPLBartModel
poolformerZPoolFormerModel)
prophetnetZProphetNetModelpvtZPvtModel)pvt_v2Z
PvtV2Model)qdqbertZQDQBertModel)qwen2Z
Qwen2Model)
qwen2_5_vlZQwen2_5_VLModel)Zqwen2_5_vl_textZQwen2_5_VLTextModel)Zqwen2_audio_encoderZQwen2AudioEncoder)	qwen2_moeZQwen2MoeModel)qwen2_vlZQwen2VLModel)Zqwen2_vl_textZQwen2VLTextModel)qwen3Z
Qwen3Model)	qwen3_moeZQwen3MoeModel)recurrent_gemmaZRecurrentGemmaModelreformerZReformerModelregnetZRegNetModelrembertZRemBertModelresnetZResNetModelZ	retribertZRetriBertModelrobertaZRobertaModelroberta-prelayernormZRobertaPreLayerNormModelroc_bertZRoCBertModelroformerZRoFormerModel)rt_detrZRTDetrModel)
rt_detr_v2ZRTDetrV2Model)rwkvZ	RwkvModelZsamZSamModelZsam_hqZ
SamHQModel)Zsam_hq_vision_modelZSamHQVisionModel)Zsam_vision_modelZSamVisionModel)seamless_m4tZSeamlessM4TModel)seamless_m4t_v2ZSeamlessM4Tv2Model	segformerZSegformerModel)ZseggptZSegGptModel)sewZSEWModel)sew-dZ	SEWDModelsiglipZSiglipModelsiglip2ZSiglip2ModelZsiglip_vision_modelZSiglipVisionModel)smolvlmZSmolVLMModel)Zsmolvlm_visionZSmolVLMVisionTransformer)speech_to_textZSpeech2TextModel)speecht5ZSpeechT5Model)splinterZSplinterModelsqueezebertZSqueezeBertModel)stablelmZStableLmModel)
starcoder2ZStarcoder2Model)Z	superglueZSuperGlueForKeypointMatchingswiftformerZSwiftFormerModelswinZ	SwinModelswin2srZSwin2SRModelswinv2ZSwinv2Model)switch_transformersZSwitchTransformersModel)t5ZT5Modeltable-transformerZTableTransformerModel)tapasZ
TapasModel)textnetZTextNetModel)Ztime_series_transformerZTimeSeriesTransformerModel)timesfmZTimesFmModeltimesformerZTimesformerModelZtimm_backboneZTimmBackbonetimm_wrapperZTimmWrapperModel)Ztrajectory_transformerZTrajectoryTransformerModel)
transfo-xlZTransfoXLModel)tvltZ	TvltModel)ZtvpZTvpModel)udopZ	UdopModel)umt5Z	UMT5Model)	unispeechZUniSpeechModel)unispeech-satZUniSpeechSatModel)ZunivnetZUnivNetModelvanZVanModel)video_llavaZVideoLlavaModelvideomaeZVideoMAEModel)viltZ	ViltModel)vipllavaZVipLlavaModel)zvision-text-dual-encoderZVisionTextDualEncoderModel)visual_bertZVisualBertModelvitZViTModel
vit_hybridZViTHybridModelvit_maeZViTMAEModelvit_msnZViTMSNModelvitdetZVitDetModelZvitsZ	VitsModelvivitZ
VivitModel)wav2vec2ZWav2Vec2Model)wav2vec2-bertZWav2Vec2BertModel)wav2vec2-conformerZWav2Vec2ConformerModel)wavlmZ
WavLMModel)whisperZWhisperModel)ZxclipZ
XCLIPModel)xglmZ	XGLMModelxlmZXLMModel)xlm-prophetnetZXLMProphetNetModelxlm-robertaZXLMRobertaModelxlm-roberta-xlZXLMRobertaXLModel)xlnetZ
XLNetModel)xmodZ	XmodModelyolosZ
YolosModel)yosoZ	YosoModel)zambaZ
ZambaModel)zamba2ZZamba2Model)Q)r   ZAlbertForPreTrainingr   ZBartForConditionalGeneration)r   ZBertForPreTraining)r   ZBigBirdForPreTrainingr(   ZBloomForCausalLMr*   ZCamembertForMaskedLMZcolpaliZColPaliForRetrievalrA   ZCTRLLMHeadModelrH   ZData2VecTextForMaskedLMrM   ZDebertaForMaskedLMrO   ZDebertaV2ForMaskedLMrc   ZDistilBertForMaskedLM)rl   ZElectraForPreTraining)rn   ZErnieForPreTrainingrr   ZFalconMambaForCausalLMrv   ZFlaubertWithLMHeadModel)rw   ZFlavaForPreTraining)rx   ZFNetForPreTrainingr{   ZFSMTForConditionalGeneration)r|   ZFunnelForPreTrainingr   Gemma3ForConditionalGenerationr   GPT2LMHeadModelr   r  r   ZGPTBigCodeForCausalLMr   )r   ZHieraForPreTrainingr   ZIBertForMaskedLMr   ZIdeficsForVisionText2Textr   Z Idefics2ForConditionalGenerationr   Z Idefics3ForConditionalGenerationr   ZJanusForConditionalGenerationr   ZLayoutLMForMaskedLMr   LlavaForConditionalGenerationr   Z!LlavaNextForConditionalGenerationr   Z&LlavaNextVideoForConditionalGenerationr   Z&LlavaOnevisionForConditionalGenerationr   ZLongformerForMaskedLMr   ZLukeForMaskedLM)r   ZLxmertForPreTrainingr   ZMambaForCausalLMr   ZMamba2ForCausalLMr   ZMegaForMaskedLM)r   ZMegatronBertForPreTrainingr   Z Mistral3ForConditionalGenerationr   ZMllamaForConditionalGeneration)r   ZMobileBertForPreTrainingr   ZMPNetForMaskedLMr   ZMptForCausalLMr   ZMraForMaskedLMr   ZMvpForConditionalGeneration)r   ZNezhaForPreTrainingr   ZNllbMoeForConditionalGenerationr   ZOpenAIGPTLMHeadModelr   Z!PaliGemmaForConditionalGenerationZqwen2_audioZ"Qwen2AudioForConditionalGenerationr  r  ZRobertaForMaskedLMr  ZRobertaPreLayerNormForMaskedLM)r   ZRoCBertForPreTrainingr%  ZRwkvForCausalLM)r6  ZSplinterForPreTrainingr8  ZSqueezeBertForMaskedLMrC  Z*SwitchTransformersForConditionalGenerationrD  ZT5ForConditionalGenerationrG  ZTapasForMaskedLMrO  ZTransfoXLLMHeadModel)rP  ZTvltForPreTraining)rS  ZUniSpeechForPreTraining)rT  ZUniSpeechSatForPreTrainingrW  Z"VideoLlavaForConditionalGeneration)rY  ZVideoMAEForPreTrainingr[  Z VipLlavaForConditionalGeneration)r\  ZVisualBertForPreTraining)rb  ZViTMAEForPreTraining)rj  ZWav2Vec2ForPreTraining)rl  ZWav2Vec2ConformerForPreTrainingrq  ZXLMWithLMHeadModelrt  ZXLMRobertaForMaskedLMrv  ZXLMRobertaXLForMaskedLMrw  ZXLNetLMHeadModelrx  ZXmodForMaskedLM)Qr   ZAlbertForMaskedLMr~  r   ZBertForMaskedLMr   ZBigBirdForMaskedLMr   Z&BigBirdPegasusForConditionalGenerationr$   Z'BlenderbotSmallForConditionalGenerationr  r  r5   ZCodeGenForCausalLMr:   ZConvBertForMaskedLMr?   ZCpmAntForCausalLMr  r  r  r  r  rl   ZElectraForMaskedLMzencoder-decoderZEncoderDecoderModelrn   ZErnieForMaskedLMrp   ZEsmForMaskedLMr  r  rx   ZFNetForMaskedLMr  r|   ZFunnelForMaskedLMr   ZGitForCausalLMr  r  r  r   ZGPTNeoForCausalLMr   ZGPTNeoXForCausalLMr   ZGPTNeoXJapaneseForCausalLMr   ZGPTJForCausalLMr   r  r  r   ZLEDForConditionalGenerationr  r   ZLongT5ForConditionalGenerationr  r   ZM2M100ForConditionalGenerationr  r  r   ZMarianMTModelr  r   ZMegatronBertForCausalLMr   ZMobileBertForMaskedLMr   Z!MoonshineForConditionalGenerationr  r  r  r  r   ZNezhaForMaskedLMr  r   ZNystromformerForMaskedLMr  r   Z PegasusXForConditionalGenerationr  ZPLBartForConditionalGenerationZ	pop2pianoZ!Pop2PianoForConditionalGenerationr
  ZQDQBertForMaskedLMr  ZReformerModelWithLMHeadr  ZRemBertForMaskedLMr  r  r   ZRoCBertForMaskedLMr"  ZRoFormerForMaskedLMr  r4  Z#Speech2TextForConditionalGenerationr  r  r  r  r  rj  ZWav2Vec2ForMaskedLMrn  ZWhisperForConditionalGenerationr  r  r  r  r  r{  ZYosoForMaskedLM)o)r   ZAriaTextForCausalLM)r   ZBambaForCausalLM)r   ZBartForCausalLM)r   ZBertLMHeadModel)r   ZBertGenerationDecoder)r   ZBigBirdForCausalLM)r   ZBigBirdPegasusForCausalLM)r   ZBioGptForCausalLM)r"   ZBitNetForCausalLM)r#   ZBlenderbotForCausalLM)r$   ZBlenderbotSmallForCausalLMr  )r*   ZCamembertForCausalLM)r3   LlamaForCausalLMr  )r6   ZCohereForCausalLM)r7   ZCohere2ForCausalLMr  r  )rH   ZData2VecTextForCausalLM)rK   ZDbrxForCausalLM)rP   ZDeepseekV3ForCausalLM)r[   ZDiffLlamaForCausalLM)rl   ZElectraForCausalLM)rm   ZEmu3ForCausalLM)rn   ZErnieForCausalLM)rq   ZFalconForCausalLMr  r}   ZFuyuForCausalLM)r~   ZGemmaForCausalLM)r   ZGemma2ForCausalLMr  )r   ZGemma3ForCausalLMr  )r   ZGlmForCausalLM)r   ZGlm4ForCausalLMr   ZGotOcr2ForConditionalGenerationr  r  r  r  r  r  r  )r   ZGraniteForCausalLM)r   ZGraniteMoeForCausalLM)r   ZGraniteMoeHybridForCausalLM)r   ZGraniteMoeSharedForCausalLM)r   ZHeliumForCausalLM)r   ZJambaForCausalLM)r   ZJetMoeForCausalLM)r   r  )r   Llama4ForCausalLM)r   r  r  r  )r   ZMarianForCausalLM)r   ZMBartForCausalLM)r   ZMegaForCausalLMr  )r   ZMistralForCausalLM)r   ZMixtralForCausalLM)r   ZMllamaForCausalLM)r   ZMoshiForCausalLMr  )r   ZMusicgenForCausalLM)r   ZMusicgenMelodyForCausalLM)r   ZMvpForCausalLM)r   ZNemotronForCausalLM)r   ZOlmoForCausalLM)r   ZOlmo2ForCausalLM)r   ZOlmoeForCausalLM)r   ZOpenLlamaForCausalLMr  )r   ZOPTForCausalLM)r   ZPegasusForCausalLM)r   ZPersimmonForCausalLM)r   ZPhiForCausalLM)r   ZPhi3ForCausalLM)r   ZPhi4MultimodalForCausalLM)r  ZPhimoeForCausalLM)r  ZPLBartForCausalLM)r  ZProphetNetForCausalLM)r
  ZQDQBertLMHeadModel)r  ZQwen2ForCausalLM)r  ZQwen2MoeForCausalLM)r  ZQwen3ForCausalLM)r  ZQwen3MoeForCausalLM)r  ZRecurrentGemmaForCausalLMr  )r  ZRemBertForCausalLM)r  ZRobertaForCausalLM)r  ZRobertaPreLayerNormForCausalLM)r   ZRoCBertForCausalLM)r"  ZRoFormerForCausalLMr  )Zspeech_to_text_2ZSpeech2Text2ForCausalLM)r9  ZStableLmForCausalLM)r:  ZStarcoder2ForCausalLMr  )ZtrocrZTrOCRForCausalLM)rn  ZWhisperForCausalLM)ro  ZXGLMForCausalLMr  )rr  ZXLMProphetNetForCausalLM)rt  ZXLMRobertaForCausalLM)rv  ZXLMRobertaXLForCausalLMr  )rx  ZXmodForCausalLM)r|  ZZambaForCausalLM)r}  ZZamba2ForCausalLM)7r   r    r8   r;   r=   rD   rI   rQ   rS   rU   rW   rY   r\   r^   r`   re   rg   ri   ry   r   r   r   r   r   )r   ZLlama4VisionModelr   )r   ZMllamaVisionModelr   r   r   r   r   r  r  r  r  r*  r2  r;  r=  r?  rA  rE  rJ  rL  rM  rU  rX  r]  r_  ra  rc  re  rh  ry  ))rT   ZDeiTForMaskedImageModeling)rz   ZFocalNetForMaskedImageModeling)r>  ZSwinForMaskedImageModeling)rB  ZSwinv2ForMaskedImageModeling)r^  ZViTForMaskedImageModeling)r   ZImageGPTForCausalImageModeling),)r   ZBeitForImageClassification)r!   ZBitForImageClassification)r0   ZCLIPForImageClassification)r<   ZConvNextForImageClassification)r>   Z ConvNextV2ForImageClassification)rB   ZCvtForImageClassification)rJ   Z$Data2VecVisionForImageClassification)rT   )ZDeiTForImageClassificationZ%DeiTForImageClassificationWithTeacher)r]   ZDinatForImageClassification)r_   ZDinov2ForImageClassification)ra   Z)Dinov2WithRegistersForImageClassification)rd   ZDonutSwinForImageClassification)rh   )Z%EfficientFormerForImageClassificationZ0EfficientFormerForImageClassificationWithTeacher)rj   Z"EfficientNetForImageClassification)rz   ZFocalNetForImageClassification)r   ZHGNetV2ForImageClassification)r   ZHieraForImageClassification)r   ZIJepaForImageClassification)r   ZImageGPTForImageClassification)r   )ZLevitForImageClassificationZ&LevitForImageClassificationWithTeacher)r   Z!MobileNetV1ForImageClassification)r   Z!MobileNetV2ForImageClassification)r   ZMobileViTForImageClassification)r   Z!MobileViTV2ForImageClassification)r   ZNatForImageClassification)r   )Z&PerceiverForImageClassificationLearnedZ&PerceiverForImageClassificationFourierZ-PerceiverForImageClassificationConvProcessing)r  Z PoolFormerForImageClassification)r  ZPvtForImageClassification)r	  ZPvtV2ForImageClassification)r  ZRegNetForImageClassification)r  ZResNetForImageClassification)r+  ZSegformerForImageClassification)shieldgemma2Z"ShieldGemma2ForImageClassification)r/  ZSiglipForImageClassification)r1  ZSiglip2ForImageClassification)r<  Z!SwiftFormerForImageClassification)r>  ZSwinForImageClassification)rB  ZSwinv2ForImageClassification)rH  ZTextNetForImageClassification)rN  Z!TimmWrapperForImageClassification)rV  ZVanForImageClassification)r^  ZViTForImageClassification)r`  ZViTHybridForImageClassification)rd  ZViTMSNForImageClassificationrZ   ZDetrForSegmentation))r   ZBeitForSemanticSegmentation)rJ   Z%Data2VecVisionForSemanticSegmentation)rf   ZDPTForSemanticSegmentation)r   Z"MobileNetV2ForSemanticSegmentation)r   Z MobileViTForSemanticSegmentation)r   Z"MobileViTV2ForSemanticSegmentation)r+  Z SegformerForSemanticSegmentation)ZupernetZUperNetForSemanticSegmentationr   Z!MaskFormerForInstanceSegmentation)r  )r   Z#Mask2FormerForUniversalSegmentationr  )r   Z!OneFormerForUniversalSegmentation))rK  Z!TimesformerForVideoClassification)rY  ZVideoMAEForVideoClassification)ri  ZVivitForVideoClassification)r&   ZBlipForConditionalGenerationr'   ZBlip2ForConditionalGenerationr,   Z!ChameleonForConditionalGenerationr  r  r  r   Z$InstructBlipForConditionalGeneration)r   Z)InstructBlipVideoForConditionalGenerationr   ZKosmos2ForConditionalGenerationr  r  r  r  r  r  r  Z
pix2structZ"Pix2StructForConditionalGenerationr  Z"Qwen2_5_VLForConditionalGenerationr  ZQwen2VLForConditionalGenerationr  r  zvision-encoder-decoderZVisionEncoderDecoderModelr  )")r   ZAriaForConditionalGeneration)r   Z!AyaVisionForConditionalGenerationr  r  r  )rm   ZEmu3ForConditionalGenerationr  r  r  r  r  r  r  r  )r   Z InternVLForConditionalGenerationr  r  r   r  r  r  r  r  r  r  r  )r  r  r  r  )r  r  )r3  ZSmolVLMForConditionalGeneration)rQ  ZUdopForConditionalGenerationr  r  ).r  r~  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r   ZMBartForConditionalGenerationr  )r   ZMegatronBertForMaskedLMr  )r   ZModernBertForMaskedLMr  r  r  r  r  )r   ZPerceiverForMaskedLMr  )r  ZReformerForMaskedLMr  r  r  r  r  r  r  r  r  r  r  r  r  )
)r9   Z!ConditionalDetrForObjectDetection)rC   ZDFineForObjectDetection)rE   ZDabDetrForObjectDetection)rR   Z DeformableDetrForObjectDetection)rX   ZDetaForObjectDetection)rZ   ZDetrForObjectDetection)r#  ZRTDetrForObjectDetection)r$  ZRTDetrV2ForObjectDetection)rF  Z"TableTransformerForObjectDetection)rz  ZYolosForObjectDetection))r   ZGroundingDinoForObjectDetectionr   )r   ZOwlv2ForObjectDetection)r   ZOwlViTForObjectDetection))Zdepth_anythingZDepthAnythingForDepthEstimation)rV   ZDepthProForDepthEstimation)rf   ZDPTForDepthEstimation)r   ZGLPNForDepthEstimation)Zprompt_depth_anythingZ%PromptDepthAnythingForDepthEstimation)ZzoedepthZZoeDepthForDepthEstimation)r~  r  )r#   Z"BlenderbotForConditionalGenerationr  r  r  r   Zgranite_speechZ%GraniteSpeechForConditionalGenerationr  r  r  r  r  )r   ZMT5ForConditionalGenerationr  r  )r   ZPegasusForConditionalGenerationr  r  )r  Z"ProphetNetForConditionalGenerationr  )r(  ZSeamlessM4TForTextToText)r)  ZSeamlessM4Tv2ForTextToTextr  r  )rR  ZUMT5ForConditionalGeneration)rr  Z%XLMProphetNetForConditionalGeneration)	r  r  r  )r(  ZSeamlessM4TForSpeechToText)r)  ZSeamlessM4Tv2ForSpeechToText)zspeech-encoder-decoderZSpeechEncoderDecoderModelr  )r5  ZSpeechT5ForSpeechToTextr  )b)r   ZAlbertForSequenceClassification)r   ZBartForSequenceClassification)r   ZBertForSequenceClassification)r   Z BigBirdForSequenceClassification)r   Z'BigBirdPegasusForSequenceClassification)r   ZBioGptForSequenceClassification)r(   ZBloomForSequenceClassification)r*   Z"CamembertForSequenceClassification)r+   ZCanineForSequenceClassification)r3   LlamaForSequenceClassification)r:   Z!ConvBertForSequenceClassification)rA   ZCTRLForSequenceClassification)rH   Z%Data2VecTextForSequenceClassification)rM   Z DebertaForSequenceClassification)rO   Z"DebertaV2ForSequenceClassification)r[   Z"DiffLlamaForSequenceClassification)rc   Z#DistilBertForSequenceClassification)rl   Z ElectraForSequenceClassification)rn   ZErnieForSequenceClassification)ro   ZErnieMForSequenceClassification)rp   ZEsmForSequenceClassification)rq   ZFalconForSequenceClassification)rv   Z!FlaubertForSequenceClassification)rx   ZFNetForSequenceClassification)r|   ZFunnelForSequenceClassification)r~   ZGemmaForSequenceClassification)r   ZGemma2ForSequenceClassification)r   ZGlmForSequenceClassification)r   ZGlm4ForSequenceClassification)r   GPT2ForSequenceClassification)r   r  )r   Z#GPTBigCodeForSequenceClassification)r   ZGPTNeoForSequenceClassification)r   Z GPTNeoXForSequenceClassification)r   ZGPTJForSequenceClassification)r   ZHeliumForSequenceClassification)r   ZIBertForSequenceClassification)r   ZJambaForSequenceClassification)r   ZJetMoeForSequenceClassification)r   Z!LayoutLMForSequenceClassification)r   Z#LayoutLMv2ForSequenceClassification)r   Z#LayoutLMv3ForSequenceClassification)r   ZLEDForSequenceClassification)r   ZLiltForSequenceClassification)r   r  )r   Z#LongformerForSequenceClassification)r   ZLukeForSequenceClassification)r   Z!MarkupLMForSequenceClassification)r   ZMBartForSequenceClassification)r   ZMegaForSequenceClassification)r   Z%MegatronBertForSequenceClassification)r   Z MistralForSequenceClassification)r   Z MixtralForSequenceClassification)r   Z#MobileBertForSequenceClassification)r   Z#ModernBertForSequenceClassification)r   ZMPNetForSequenceClassification)r   ZMptForSequenceClassification)r   ZMraForSequenceClassification)r   ZMT5ForSequenceClassification)r   ZMvpForSequenceClassification)r   Z!NemotronForSequenceClassification)r   ZNezhaForSequenceClassification)r   Z&NystromformerForSequenceClassification)r   Z"OpenLlamaForSequenceClassification)r   Z"OpenAIGPTForSequenceClassification)r   ZOPTForSequenceClassification)r   Z"PerceiverForSequenceClassification)r   Z"PersimmonForSequenceClassification)r   ZPhiForSequenceClassification)r   ZPhi3ForSequenceClassification)r  ZPhimoeForSequenceClassification)r  ZPLBartForSequenceClassification)r
  Z QDQBertForSequenceClassification)r  ZQwen2ForSequenceClassification)r  Z!Qwen2MoeForSequenceClassification)r  ZQwen3ForSequenceClassification)r  Z!Qwen3MoeForSequenceClassification)r  Z!ReformerForSequenceClassification)r  Z RemBertForSequenceClassification)r  Z RobertaForSequenceClassification)r  Z,RobertaPreLayerNormForSequenceClassification)r   Z RoCBertForSequenceClassification)r"  Z!RoFormerForSequenceClassification)r8  Z$SqueezeBertForSequenceClassification)r9  Z!StableLmForSequenceClassification)r:  Z#Starcoder2ForSequenceClassification)rD  ZT5ForSequenceClassification)rG  ZTapasForSequenceClassification)rO  Z"TransfoXLForSequenceClassification)rR  ZUMT5ForSequenceClassification)rq  ZXLMForSequenceClassification)rt  Z#XLMRobertaForSequenceClassification)rv  Z%XLMRobertaXLForSequenceClassification)rw  ZXLNetForSequenceClassification)rx  ZXmodForSequenceClassification)r{  ZYosoForSequenceClassification)r|  ZZambaForSequenceClassification)r}  ZZamba2ForSequenceClassification)H)r   ZAlbertForQuestionAnswering)r   ZBartForQuestionAnswering)r   ZBertForQuestionAnswering)r   ZBigBirdForQuestionAnswering)r   Z"BigBirdPegasusForQuestionAnswering)r(   ZBloomForQuestionAnswering)r*   ZCamembertForQuestionAnswering)r+   ZCanineForQuestionAnswering)r:   ZConvBertForQuestionAnswering)rH   Z Data2VecTextForQuestionAnswering)rM   ZDebertaForQuestionAnswering)rO   ZDebertaV2ForQuestionAnswering)r[   ZDiffLlamaForQuestionAnswering)rc   ZDistilBertForQuestionAnswering)rl   ZElectraForQuestionAnswering)rn   ZErnieForQuestionAnswering)ro   ZErnieMForQuestionAnswering)rq   ZFalconForQuestionAnswering)rv   Z"FlaubertForQuestionAnsweringSimple)rx   ZFNetForQuestionAnswering)r|   ZFunnelForQuestionAnswering)r   ZGPT2ForQuestionAnswering)r   ZGPTNeoForQuestionAnswering)r   ZGPTNeoXForQuestionAnswering)r   ZGPTJForQuestionAnswering)r   ZIBertForQuestionAnsweringr   ZLayoutLMv2ForQuestionAnsweringr   ZLayoutLMv3ForQuestionAnswering)r   ZLEDForQuestionAnswering)r   ZLiltForQuestionAnswering)r   ZLlamaForQuestionAnswering)r   ZLongformerForQuestionAnswering)r   ZLukeForQuestionAnswering)r   ZLxmertForQuestionAnswering)r   ZMarkupLMForQuestionAnswering)r   ZMBartForQuestionAnswering)r   ZMegaForQuestionAnswering)r   Z MegatronBertForQuestionAnswering)r   ZMistralForQuestionAnswering)r   ZMixtralForQuestionAnswering)r   ZMobileBertForQuestionAnswering)r   ZModernBertForQuestionAnswering)r   ZMPNetForQuestionAnswering)r   ZMptForQuestionAnswering)r   ZMraForQuestionAnswering)r   ZMT5ForQuestionAnswering)r   ZMvpForQuestionAnswering)r   ZNemotronForQuestionAnswering)r   ZNezhaForQuestionAnswering)r   Z!NystromformerForQuestionAnswering)r   ZOPTForQuestionAnswering)r
  ZQDQBertForQuestionAnswering)r  ZQwen2ForQuestionAnswering)r  ZQwen2MoeForQuestionAnswering)r  ZQwen3ForQuestionAnswering)r  ZQwen3MoeForQuestionAnswering)r  ZReformerForQuestionAnswering)r  ZRemBertForQuestionAnswering)r  ZRobertaForQuestionAnswering)r  Z'RobertaPreLayerNormForQuestionAnswering)r   ZRoCBertForQuestionAnswering)r"  ZRoFormerForQuestionAnswering)r6  ZSplinterForQuestionAnswering)r8  ZSqueezeBertForQuestionAnswering)rD  ZT5ForQuestionAnswering)rR  ZUMT5ForQuestionAnswering)rq  ZXLMForQuestionAnsweringSimple)rt  ZXLMRobertaForQuestionAnswering)rv  Z XLMRobertaXLForQuestionAnswering)rw  ZXLNetForQuestionAnsweringSimple)rx  ZXmodForQuestionAnswering)r{  ZYosoForQuestionAnswering)rG  ZTapasForQuestionAnswering))r&   ZBlipForQuestionAnsweringr  )rZ  ZViltForQuestionAnswering))r   ZLayoutLMForQuestionAnsweringr  r  )N)r   ZAlbertForTokenClassification)r   ZBertForTokenClassification)r   ZBigBirdForTokenClassification)r   ZBioGptForTokenClassification)r(   ZBloomForTokenClassification)r)   ZBrosForTokenClassification)r*   ZCamembertForTokenClassification)r+   ZCanineForTokenClassification)r:   ZConvBertForTokenClassification)rH   Z"Data2VecTextForTokenClassification)rM   ZDebertaForTokenClassification)rO   ZDebertaV2ForTokenClassification)r[   ZDiffLlamaForTokenClassification)rc   Z DistilBertForTokenClassification)rl   ZElectraForTokenClassification)rn   ZErnieForTokenClassification)ro   ZErnieMForTokenClassification)rp   ZEsmForTokenClassification)rq   ZFalconForTokenClassification)rv   ZFlaubertForTokenClassification)rx   ZFNetForTokenClassification)r|   ZFunnelForTokenClassification)r~   ZGemmaForTokenClassification)r   ZGemma2ForTokenClassification)r   ZGlmForTokenClassification)r   ZGlm4ForTokenClassification)r   GPT2ForTokenClassification)r   r  )r   Z GPTBigCodeForTokenClassification)r   ZGPTNeoForTokenClassification)r   ZGPTNeoXForTokenClassification)r   ZHeliumForTokenClassification)r   ZIBertForTokenClassification)r   ZLayoutLMForTokenClassification)r   Z LayoutLMv2ForTokenClassification)r   Z LayoutLMv3ForTokenClassification)r   ZLiltForTokenClassification)r   ZLlamaForTokenClassification)r   Z LongformerForTokenClassification)r   ZLukeForTokenClassification)r   ZMarkupLMForTokenClassification)r   ZMegaForTokenClassification)r   Z"MegatronBertForTokenClassification)r   ZMistralForTokenClassification)r   ZMixtralForTokenClassification)r   Z MobileBertForTokenClassification)r   Z ModernBertForTokenClassification)r   ZMPNetForTokenClassification)r   ZMptForTokenClassification)r   ZMraForTokenClassification)r   ZMT5ForTokenClassification)r   ZNemotronForTokenClassification)r   ZNezhaForTokenClassification)r   Z#NystromformerForTokenClassification)r   ZPersimmonForTokenClassification)r   ZPhiForTokenClassification)r   ZPhi3ForTokenClassification)r
  ZQDQBertForTokenClassification)r  ZQwen2ForTokenClassification)r  ZQwen2MoeForTokenClassification)r  ZQwen3ForTokenClassification)r  ZQwen3MoeForTokenClassification)r  ZRemBertForTokenClassification)r  ZRobertaForTokenClassification)r  Z)RobertaPreLayerNormForTokenClassification)r   ZRoCBertForTokenClassification)r"  ZRoFormerForTokenClassification)r8  Z!SqueezeBertForTokenClassification)r9  ZStableLmForTokenClassification)r:  Z Starcoder2ForTokenClassification)rD  ZT5ForTokenClassification)rR  ZUMT5ForTokenClassification)rq  ZXLMForTokenClassification)rt  Z XLMRobertaForTokenClassification)rv  Z"XLMRobertaXLForTokenClassification)rw  ZXLNetForTokenClassification)rx  ZXmodForTokenClassification)r{  ZYosoForTokenClassification)&)r   ZAlbertForMultipleChoice)r   ZBertForMultipleChoice)r   ZBigBirdForMultipleChoice)r*   ZCamembertForMultipleChoice)r+   ZCanineForMultipleChoice)r:   ZConvBertForMultipleChoice)rH   ZData2VecTextForMultipleChoice)rO   ZDebertaV2ForMultipleChoice)rc   ZDistilBertForMultipleChoice)rl   ZElectraForMultipleChoice)rn   ZErnieForMultipleChoice)ro   ZErnieMForMultipleChoice)rv   ZFlaubertForMultipleChoice)rx   ZFNetForMultipleChoice)r|   ZFunnelForMultipleChoice)r   ZIBertForMultipleChoice)r   ZLongformerForMultipleChoice)r   ZLukeForMultipleChoice)r   ZMegaForMultipleChoice)r   ZMegatronBertForMultipleChoice)r   ZMobileBertForMultipleChoice)r   ZMPNetForMultipleChoice)r   ZMraForMultipleChoice)r   ZNezhaForMultipleChoice)r   ZNystromformerForMultipleChoice)r
  ZQDQBertForMultipleChoice)r  ZRemBertForMultipleChoice)r  ZRobertaForMultipleChoice)r  Z$RobertaPreLayerNormForMultipleChoice)r   ZRoCBertForMultipleChoice)r"  ZRoFormerForMultipleChoice)r8  ZSqueezeBertForMultipleChoice)rq  ZXLMForMultipleChoice)rt  ZXLMRobertaForMultipleChoice)rv  ZXLMRobertaXLForMultipleChoice)rw  ZXLNetForMultipleChoice)rx  ZXmodForMultipleChoice)r{  ZYosoForMultipleChoice))r   ZBertForNextSentencePrediction)rn   ZErnieForNextSentencePrediction)rx   ZFNetForNextSentencePrediction)r   Z%MegatronBertForNextSentencePrediction)r   Z#MobileBertForNextSentencePrediction)r   ZNezhaForNextSentencePrediction)r
  Z QDQBertForNextSentencePrediction))r   ZASTForAudioClassification)rF   Z&Data2VecAudioForSequenceClassification)r   ZHubertForSequenceClassification)r,  ZSEWForSequenceClassification)r-  ZSEWDForSequenceClassification)rS  Z"UniSpeechForSequenceClassification)rT  Z%UniSpeechSatForSequenceClassification)rj  Z!Wav2Vec2ForSequenceClassification)rk  Z%Wav2Vec2BertForSequenceClassification)rl  Z*Wav2Vec2ConformerForSequenceClassification)rm  ZWavLMForSequenceClassification)rn  ZWhisperForAudioClassification))rF   ZData2VecAudioForCTC)r   ZHubertForCTC)r   ZMCTCTForCTC)r,  Z	SEWForCTC)r-  Z
SEWDForCTC)rS  ZUniSpeechForCTC)rT  ZUniSpeechSatForCTC)rj  ZWav2Vec2ForCTC)rk  ZWav2Vec2BertForCTC)rl  ZWav2Vec2ConformerForCTC)rm  ZWavLMForCTC))rF   Z(Data2VecAudioForAudioFrameClassification)rT  Z'UniSpeechSatForAudioFrameClassification)rj  Z#Wav2Vec2ForAudioFrameClassification)rk  Z'Wav2Vec2BertForAudioFrameClassification)rl  Z,Wav2Vec2ConformerForAudioFrameClassification)rm  Z WavLMForAudioFrameClassification))rF   ZData2VecAudioForXVector)rT  ZUniSpeechSatForXVector)rj  ZWav2Vec2ForXVector)rk  ZWav2Vec2BertForXVector)rl  ZWav2Vec2ConformerForXVector)rm  ZWavLMForXVectorrs   )r5  ZSpeechT5ForTextToSpeech)	r   r@   )rt   ZFastSpeech2ConformerWithHifiGan)r   Z MusicgenForConditionalGeneration)r   Z&MusicgenMelodyForConditionalGeneration)Zqwen2_5_omniZ#Qwen2_5OmniForConditionalGeneration)r(  ZSeamlessM4TForTextToSpeech)r)  ZSeamlessM4Tv2ForTextToSpeechrg  )	r   r   r%   )r'   ZBlip2ForImageTextRetrievalr-   r/   r2   r.  r0  ))r   ZBeitBackbone)r!   ZBitBackbone)r<   ZConvNextBackbone)r>   ZConvNextV2Backbone)r]   ZDinatBackbone)r_   ZDinov2Backbone)ra   ZDinov2WithRegistersBackbone)rz   ZFocalNetBackboner   )r   ZHieraBackbone)r   ZMaskFormerSwinBackbone)r   ZNatBackbone)r	  ZPvtV2Backbone)r  ZResNetBackbone)Zrt_detr_resnetZRTDetrResNetBackbone)r>  ZSwinBackbone)rB  ZSwinv2Backbone)rH  ZTextNetBackbonerL  )rf  ZVitDetBackbone)Zvitpose_backboneZVitPoseBackboner&  r'  )Z
superpointZSuperPointForKeypointDetection)r   r   r   r1   rG   rL   rN   rb   rk   )rm   ZEmu3TextModelru   r   )r   r   r   )r   ZMllamaTextModelr   )r   ZMT5EncoderModelr   r  r  r  r  r  r!  r7  )rD  ZT5EncoderModel)rR  ZUMT5EncoderModelrp  rs  ru  )r   Z'PatchTSMixerForTimeSeriesClassification)r   ZPatchTSTForClassification)r   ZPatchTSMixerForRegression)r   ZPatchTSTForRegression)rI  ZTimesFmModelForPrediction)r@  ZSwin2SRForImageSuperResolutionc                   @      e Zd ZeZdS )AutoModelForMaskGenerationN)__name__
__module____qualname__!MODEL_FOR_MASK_GENERATION_MAPPING_model_mapping r  r  U/var/www/auris/lib/python3.10/site-packages/transformers/models/auto/modeling_auto.pyr        r  c                   @   r  )AutoModelForKeypointDetectionN)r  r  r  $MODEL_FOR_KEYPOINT_DETECTION_MAPPINGr  r  r  r  r   r    r  r  c                   @   r  )AutoModelForTextEncodingN)r  r  r  MODEL_FOR_TEXT_ENCODING_MAPPINGr  r  r  r  r   r    r  r  c                   @   r  )AutoModelForImageToImageN)r  r  r   MODEL_FOR_IMAGE_TO_IMAGE_MAPPINGr  r  r  r  r   r    r  r  c                   @   r  )	AutoModelN)r  r  r  MODEL_MAPPINGr  r  r  r  r   r    r  r  c                   @   r  )AutoModelForPreTrainingN)r  r  r  MODEL_FOR_PRETRAINING_MAPPINGr  r  r  r  r   r
    r  r
  Zpretraining)head_docc                   @   r  )_AutoModelWithLMHeadN)r  r  r  MODEL_WITH_LM_HEAD_MAPPINGr  r  r  r  r   r    r  r  zlanguage modelingc                   @   r  )AutoModelForCausalLMN)r  r  r  MODEL_FOR_CAUSAL_LM_MAPPINGr  r  r  r  r   r    r  r  zcausal language modelingc                   @   r  )AutoModelForMaskedLMN)r  r  r  MODEL_FOR_MASKED_LM_MAPPINGr  r  r  r  r   r    r  r  zmasked language modelingc                   @   r  )AutoModelForSeq2SeqLMN)r  r  r  &MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPINGr  r  r  r  r   r    r  r  z&sequence-to-sequence language modelingzgoogle-t5/t5-base)r  Zcheckpoint_for_examplec                   @   r  )"AutoModelForSequenceClassificationN)r  r  r  )MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPINGr  r  r  r  r   r    r  r  zsequence classificationc                   @   r  )AutoModelForQuestionAnsweringN)r  r  r  $MODEL_FOR_QUESTION_ANSWERING_MAPPINGr  r  r  r  r   r    r  r  zquestion answeringc                   @   r  )"AutoModelForTableQuestionAnsweringN)r  r  r  *MODEL_FOR_TABLE_QUESTION_ANSWERING_MAPPINGr  r  r  r  r   r    r  r  ztable question answeringzgoogle/tapas-base-finetuned-wtqc                   @   r  )#AutoModelForVisualQuestionAnsweringN)r  r  r  +MODEL_FOR_VISUAL_QUESTION_ANSWERING_MAPPINGr  r  r  r  r   r  	  r  r  zvisual question answeringzdandelin/vilt-b32-finetuned-vqac                   @   r  )%AutoModelForDocumentQuestionAnsweringN)r  r  r  -MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPINGr  r  r  r  r   r    r  r  zdocument question answeringz/impira/layoutlm-document-qa", revision="52e01b3c                   @   r  )AutoModelForTokenClassificationN)r  r  r  &MODEL_FOR_TOKEN_CLASSIFICATION_MAPPINGr  r  r  r  r   r    r  r  ztoken classificationc                   @   r  )AutoModelForMultipleChoiceN)r  r  r  !MODEL_FOR_MULTIPLE_CHOICE_MAPPINGr  r  r  r  r   r!  &  r  r!  zmultiple choicec                   @   r  )"AutoModelForNextSentencePredictionN)r  r  r  *MODEL_FOR_NEXT_SENTENCE_PREDICTION_MAPPINGr  r  r  r  r   r#  -  r  r#  znext sentence predictionc                   @   r  )AutoModelForImageClassificationN)r  r  r  &MODEL_FOR_IMAGE_CLASSIFICATION_MAPPINGr  r  r  r  r   r%  6  r  r%  zimage classificationc                   @   r  )'AutoModelForZeroShotImageClassificationN)r  r  r  0MODEL_FOR_ZERO_SHOT_IMAGE_CLASSIFICATION_MAPPINGr  r  r  r  r   r'  =  r  r'  zzero-shot image classificationc                   @   r  )AutoModelForImageSegmentationN)r  r  r  $MODEL_FOR_IMAGE_SEGMENTATION_MAPPINGr  r  r  r  r   r)  F  r  r)  zimage segmentationc                   @   r  ) AutoModelForSemanticSegmentationN)r  r  r  'MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPINGr  r  r  r  r   r+  M  r  r+  zsemantic segmentationc                   @   r  ) AutoModelForTimeSeriesPredictionN)r  r  r  (MODEL_FOR_TIME_SERIES_PREDICTION_MAPPINGr  r  r  r  r   r-  V  r  r-  ztime-series predictionc                   @   r  )!AutoModelForUniversalSegmentationN)r  r  r  (MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPINGr  r  r  r  r   r/  _  r  r/  zuniversal image segmentationc                   @   r  ) AutoModelForInstanceSegmentationN)r  r  r  'MODEL_FOR_INSTANCE_SEGMENTATION_MAPPINGr  r  r  r  r   r1  h  r  r1  zinstance segmentationc                   @   r  )AutoModelForObjectDetectionN)r  r  r  "MODEL_FOR_OBJECT_DETECTION_MAPPINGr  r  r  r  r   r3  q  r  r3  zobject detectionc                   @   r  )#AutoModelForZeroShotObjectDetectionN)r  r  r  ,MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPINGr  r  r  r  r   r5  x  r  r5  zzero-shot object detectionc                   @   r  )AutoModelForDepthEstimationN)r  r  r  "MODEL_FOR_DEPTH_ESTIMATION_MAPPINGr  r  r  r  r   r7    r  r7  zdepth estimationc                   @   r  )AutoModelForVideoClassificationN)r  r  r  &MODEL_FOR_VIDEO_CLASSIFICATION_MAPPINGr  r  r  r  r   r9    r  r9  zvideo classificationc                   @   r  )AutoModelForVision2SeqN)r  r  r  MODEL_FOR_VISION_2_SEQ_MAPPINGr  r  r  r  r   r;    r  r;  zvision-to-text modelingc                   @   r  )AutoModelForImageTextToTextN)r  r  r  $MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPINGr  r  r  r  r   r=    r  r=  zimage-text-to-text modelingc                   @   r  )AutoModelForAudioClassificationN)r  r  r  &MODEL_FOR_AUDIO_CLASSIFICATION_MAPPINGr  r  r  r  r   r?    r  r?  zaudio classificationc                   @   r  )AutoModelForCTCN)r  r  r  MODEL_FOR_CTC_MAPPINGr  r  r  r  r   rA    r  rA  z%connectionist temporal classificationc                   @   r  )AutoModelForSpeechSeq2SeqN)r  r  r  "MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPINGr  r  r  r  r   rC    r  rC  z,sequence-to-sequence speech-to-text modelingc                   @   r  )$AutoModelForAudioFrameClassificationN)r  r  r  ,MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPINGr  r  r  r  r   rE    r  rE  z"audio frame (token) classificationc                   @   r  )AutoModelForAudioXVectorN)r  r  r  MODEL_FOR_AUDIO_XVECTOR_MAPPINGr  r  r  r  r   rG    r  rG  c                   @   r  )AutoModelForTextToSpectrogramN)r  r  r  %MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPINGr  r  r  r  r   rI    r  rI  c                   @   r  )AutoModelForTextToWaveformN)r  r  r  "MODEL_FOR_TEXT_TO_WAVEFORM_MAPPINGr  r  r  r  r   rK    r  rK  c                   @   r  )AutoBackboneN)r  r  r  MODEL_FOR_BACKBONE_MAPPINGr  r  r  r  r   rM    r  rM  zaudio retrieval via x-vectorc                   @   r  )AutoModelForMaskedImageModelingN)r  r  r  'MODEL_FOR_MASKED_IMAGE_MODELING_MAPPINGr  r  r  r  r   rO    r  rO  zmasked image modelingc                       s0   e Zd Ze fddZe fddZ  ZS )AutoModelWithLMHeadc                    s   t dt t |S NzThe class `AutoModelWithLMHead` is deprecated and will be removed in a future version. Please use `AutoModelForCausalLM` for causal language models, `AutoModelForMaskedLM` for masked language models and `AutoModelForSeq2SeqLM` for encoder-decoder models.)warningswarnFutureWarningsuperfrom_config)clsconfig	__class__r  r   rW    s
   zAutoModelWithLMHead.from_configc                    s&   t dt t j|g|R i |S rR  )rS  rT  rU  rV  from_pretrained)rX  Zpretrained_model_name_or_pathZ
model_argskwargsrZ  r  r   r\    s
   z#AutoModelWithLMHead.from_pretrained)r  r  r  classmethodrW  r\  __classcell__r  r  rZ  r   rQ    s
    	rQ  )Tr@  rF  rH  rN  'MODEL_FOR_CAUSAL_IMAGE_MODELING_MAPPINGr  rB  r  r8  r&  MODEL_FOR_IMAGE_MAPPINGr*  r  r  r2  rP  r  r  r"  r$  r4  r  r  r,  r  r  rD  r  r  rL  rJ  r.  r   r0  r:  r<  MODEL_FOR_RETRIEVAL_MAPPINGr>  r  r	  r  r(  r6  ,MODEL_FOR_TIME_SERIES_CLASSIFICATION_MAPPING(MODEL_FOR_TIME_SERIES_REGRESSION_MAPPINGr  rM  r?  rE  rG  r  rA  r7  r%  r)  r  r1  r  r  r  rO  r  r!  r#  r3  r
  r  r+  r  r  rC  r  rI  rK  r  r/  r9  r;  r  r  rQ  r'  r5  r=  )__doc__rS  collectionsr   utilsr   Zauto_factoryr   r   r   r	   Zconfiguration_autor
   Z
get_loggerr  loggerZMODEL_MAPPING_NAMESZ#MODEL_FOR_PRETRAINING_MAPPING_NAMESZ MODEL_WITH_LM_HEAD_MAPPING_NAMESZ!MODEL_FOR_CAUSAL_LM_MAPPING_NAMESZMODEL_FOR_IMAGE_MAPPING_NAMESZ-MODEL_FOR_MASKED_IMAGE_MODELING_MAPPING_NAMESZ-MODEL_FOR_CAUSAL_IMAGE_MODELING_MAPPING_NAMESZ,MODEL_FOR_IMAGE_CLASSIFICATION_MAPPING_NAMESZ*MODEL_FOR_IMAGE_SEGMENTATION_MAPPING_NAMESZ-MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPING_NAMESZ-MODEL_FOR_INSTANCE_SEGMENTATION_MAPPING_NAMESZ.MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPING_NAMESZ,MODEL_FOR_VIDEO_CLASSIFICATION_MAPPING_NAMESZ$MODEL_FOR_VISION_2_SEQ_MAPPING_NAMESZ!MODEL_FOR_RETRIEVAL_MAPPING_NAMESZ*MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMESZ!MODEL_FOR_MASKED_LM_MAPPING_NAMESZ(MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMESZ2MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPING_NAMESZ(MODEL_FOR_DEPTH_ESTIMATION_MAPPING_NAMESZ,MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMESZ(MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMESZ/MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPING_NAMESZ*MODEL_FOR_QUESTION_ANSWERING_MAPPING_NAMESZ0MODEL_FOR_TABLE_QUESTION_ANSWERING_MAPPING_NAMESZ1MODEL_FOR_VISUAL_QUESTION_ANSWERING_MAPPING_NAMESZ3MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPING_NAMESZ,MODEL_FOR_TOKEN_CLASSIFICATION_MAPPING_NAMESZ'MODEL_FOR_MULTIPLE_CHOICE_MAPPING_NAMESZ0MODEL_FOR_NEXT_SENTENCE_PREDICTION_MAPPING_NAMESZ,MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMESZMODEL_FOR_CTC_MAPPING_NAMESZ2MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPING_NAMESZ%MODEL_FOR_AUDIO_XVECTOR_MAPPING_NAMESZ+MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPING_NAMESZ(MODEL_FOR_TEXT_TO_WAVEFORM_MAPPING_NAMESZ6MODEL_FOR_ZERO_SHOT_IMAGE_CLASSIFICATION_MAPPING_NAMESZ MODEL_FOR_BACKBONE_MAPPING_NAMESZ'MODEL_FOR_MASK_GENERATION_MAPPING_NAMESZ*MODEL_FOR_KEYPOINT_DETECTION_MAPPING_NAMESZ%MODEL_FOR_TEXT_ENCODING_MAPPING_NAMESZ2MODEL_FOR_TIME_SERIES_CLASSIFICATION_MAPPING_NAMESZ.MODEL_FOR_TIME_SERIES_REGRESSION_MAPPING_NAMESZ.MODEL_FOR_TIME_SERIES_PREDICTION_MAPPING_NAMESZ&MODEL_FOR_IMAGE_TO_IMAGE_MAPPING_NAMESr	  r  r  r  r`  r&  r(  r*  r,  r2  r0  r:  r<  r>  rb  r  r  r  ra  rP  r4  r6  r8  r  r  r  r  r   r"  r$  r@  rB  rD  rF  rH  rJ  rL  rN  r  r  r  rc  rd  r.  r  r  r  r  r  r  r
  r  r  r  r  r  r  r  r  r  r  r!  r#  r%  r'  r)  r+  r-  r/  r1  r3  r5  r7  r9  r;  r=  r?  rA  rC  rE  rG  rI  rK  rM  rO  rQ  __all__r  r  r  r   <module>   s  
  GWWu=E
'4
!hNT,#


















