
    <h~p                    d   S r SSKrSSKrSSKJr  SSKJrJr  SSKJ	r	  SSK
JrJrJrJr  SS	KJr  \(       a  SS
KJr  SSKJr   " S S\\5      r\	R,                  " \5      r\" / SQ5      r\" / SQ5      r\" / SQ5      r\" / SQ5      r\" / SQ5      r\" / SQ5      r\" S/5      r\" / SQ5      r \" S/5      r!\" / SQ5      r"\" S/5      r#\" / SQ5      r$\" / SQ5      r%\" / SQ5      r&\" S/5      r'\" / SQ5      r(\" / SQ5      r)\" / SQ5      r*\" / S Q5      r+\" / S!Q5      r,\" / S"Q5      r-\" / S#Q5      r.\" / S$Q5      r/\" / S%Q5      r0\" S&/5      r1\" / S'Q5      r2\" / S(Q5      r3\" / S)Q5      r4\" / S*Q5      r5\" / S+Q5      r6\" / S,Q5      r7\" / S-Q5      r8\" / S.Q5      r9\" / S/Q5      r:\" S0S1/5      r;\" / S2Q5      r<\" / S3Q5      r=\" / S4Q5      r>\" S5S6/5      r?\" S7/5      r@\" / S8Q5      rA\" / S9Q5      rB\" S:S;/5      rC\" S<S=/5      rD\" S>/5      rE\" S?/5      rF\" S@/5      rG\" \\5      rH\" \\5      rI\" \\5      rJ\" \\5      rK\" \\5      rL\" \\ 5      rM\" \\=5      rN\" \\!5      rO\" \\"5      rP\" \\#5      rQ\" \\$5      rR\" \\%5      rS\" \\&5      rT\" \\(5      rU\" \\'5      rV\" \\25      rW\" \\35      rX\" \\)5      rY\" \\5      rZ\" \\5      r[\" \\*5      r\\" \\+5      r]\" \\,5      r^\" \\-5      r_\" \\/5      r`\" \\05      ra\" \\15      rb\" \\45      rc\" \\55      rd\" \\65      re\" \\75      rf\" \\85      rg\" \\.5      rh\" \\95      ri\" \\:5      rj\" \\;5      rk\" \\<5      rl\" \\>5      rm\" \\?5      rn\" \\@5      ro\" \\A5      rp\" \\B5      rq\" \\C5      rr\" \\D5      rs\" \\E5      rt\" \\F5      ru\" \\G5      rv " SA SB\5      rw " SC SD\5      rx " SE SF\5      ry " SG SH\5      rz " SI SJ\5      r{ " SK SL\5      r|\" \|5      r| " SM SN\5      r}\" \}SOSP9r} " SQ SR\5      r~\" \~SSSP9r~ " ST SU\5      r\" \SVSP9r " SW SX\5      r\" \SYSP9r " SZ S[\5      r\" \S\S]S^9r " S_ S`\5      r\" \SaSP9r " Sb Sc\5      r\" \SdSP9r " Se Sf\5      r\" \SgShS^9r " Si Sj\5      r\" \SkSlS^9r " Sm Sn\5      r\" \SoSpS^9r " Sq Sr\5      r\" \SsSP9r " St Su\5      r\" \SvSP9r " Sw Sx\5      r\" \SySP9r " Sz S{\5      r\" \S|SP9r " S} S~\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r " S S\5      r " S S\5      r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\5      r\" \SSP9r " S S\~5      r " S S\5      r/ SQrg)zAuto Model class.    N)OrderedDict)TYPE_CHECKINGUnion   )logging   )_BaseAutoBackboneClass_BaseAutoModelClass_LazyAutoMappingauto_class_update)CONFIG_MAPPING_NAMES)GenerationMixin)PreTrainedModelc                       \ rS rSrSrg)_BaseModelWithGenerate%    N)__name__
__module____qualname____firstlineno____static_attributes__r       ^/var/www/html/shao/venv/lib/python3.13/site-packages/transformers/models/auto/modeling_auto.pyr   r   %   s    r   r   (e  )aimv2
Aimv2Modelaimv2_vision_modelAimv2VisionModelalbertAlbertModelalign
AlignModelaltclipAltCLIPModel)arcee
ArceeModel)aria	AriaModel)	aria_textAriaTextModel)audio-spectrogram-transformerASTModel)
autoformerAutoformerModel)
aya_visionAyaVisionModel)bamba
BambaModelbark	BarkModel)bart	BartModelbeit	BeitModelbert	BertModel)bert-generationBertGenerationEncoderbig_birdBigBirdModel)bigbird_pegasusBigBirdPegasusModel)biogptBioGptModelbitBitModel)bitnetBitNetModel)
blenderbotBlenderbotModel)blenderbot-smallBlenderbotSmallModelblip	BlipModel)blip-2
Blip2Model)blip_2_qformerBlip2QFormerModel)bloom
BloomModel)bridgetowerBridgeTowerModel)bros	BrosModel)	camembertCamembertModel)canineCanineModel)	chameleonChameleonModelchinese_clipChineseCLIPModel)chinese_clip_vision_modelChineseCLIPVisionModel)clap	ClapModelclip	CLIPModelclip_text_modelCLIPTextModel)clip_vision_modelCLIPVisionModelclipsegCLIPSegModel)clvp!ClvpModelForConditionalGeneration)
code_llama
LlamaModel)codegenCodeGenModel)cohereCohereModel)cohere2Cohere2Modelcohere2_visionCohere2VisionModelconditional_detrConditionalDetrModel)convbertConvBertModelconvnextConvNextModel
convnextv2ConvNextV2Model)cpmantCpmAntModelcsmCsmForConditionalGeneration)ctrl	CTRLModel)cvtCvtModel)d_fine
DFineModeldab-detrDabDetrModeldacDacModel)data2vec-audioData2VecAudioModeldata2vec-textData2VecTextModeldata2vec-visionData2VecVisionModel)dbrx	DbrxModeldebertaDebertaModel
deberta-v2DebertaV2Model)decision_transformerDecisionTransformerModel)deepseek_v2DeepseekV2Model)deepseek_v3DeepseekV3Model)deepseek_vlDeepseekVLModel)deepseek_vl_hybridDeepseekVLHybridModeldeformable_detrDeformableDetrModeldeit	DeiTModel	depth_proDepthProModeldeta	DetaModeldetr	DetrModel)diaDiaModel)	diffllamaDiffLlamaModeldinat
DinatModeldinov2Dinov2Modeldinov2_with_registersDinov2WithRegistersModel
distilbertDistilBertModel)doge	DogeModel)
donut-swinDonutSwinModel)dots1
Dots1Model)dprDPRQuestionEncoderdptDPTModelefficientformerEfficientFormerModel)efficientloftrEfficientLoFTRModelefficientnetEfficientNetModelelectraElectraModel)emu3	Emu3Model)encodecEncodecModel)ernie
ErnieModel)ernie4_5Ernie4_5Model)ernie4_5_moeErnie4_5_MoeModel)ernie_mErnieMModel)esmEsmModel)evollaEvollaModel)exaone4Exaone4Model)falconFalconModel)	falcon_h1FalconH1Model)falcon_mambaFalconMambaModelfastspeech2_conformerFastSpeech2ConformerModel"fastspeech2_conformer_with_hifiganFastSpeech2ConformerWithHifiGanflaubertFlaubertModel)flava
FlavaModel)fnet	FNetModelfocalnetFocalNetModel)fsmt	FSMTModel)funnel)FunnelModelFunnelBaseModel)fuyu	FuyuModel)gemma
GemmaModel)gemma2Gemma2Model)gemma3Gemma3Model)gemma3_textGemma3TextModel)gemma3nGemma3nModel)gemma3n_audioGemma3nAudioEncoder)gemma3n_textGemma3nTextModel)gemma3n_visionTimmWrapperModel)gitGitModel)glmGlmModel)glm4	Glm4Model)glm4_moeGlm4MoeModel)glm4v
Glm4vModel)
glm4v_textGlm4vTextModelglpn	GLPNModel)got_ocr2GotOcr2Model)gpt-sw3	GPT2Model)gpt2rB  )gpt_bigcodeGPTBigCodeModel)gpt_neoGPTNeoModel)gpt_neoxGPTNeoXModel)gpt_neox_japaneseGPTNeoXJapaneseModel)gpt_ossGptOssModel)gptj	GPTJModelzgptsan-japanese&GPTSanJapaneseForConditionalGeneration)graniteGraniteModel)
granitemoeGraniteMoeModel)granitemoehybridGraniteMoeHybridModel)granitemoesharedGraniteMoeSharedModel)
graphormerGraphormerModel)grounding-dinoGroundingDinoModel)groupvitGroupViTModel)heliumHeliumModelhgnet_v2HGNetV2Backbonehiera
HieraModel)hubertHubertModelibert
IBertModel)ideficsIdeficsModel)idefics2Idefics2Model)idefics3Idefics3Model)idefics3_visionIdefics3VisionTransformerijepa
IJepaModelimagegptImageGPTModel)informerInformerModel)instructblipInstructBlipModel)instructblipvideoInstructBlipVideoModel)internvlInternVLModel)internvl_visionInternVLVisionModel)jamba
JambaModel)janus
JanusModel)jetmoeJetMoeModel)jukeboxJukeboxModel)kosmos-2Kosmos2Model)kyutai_speech_to_textKyutaiSpeechToTextModel)layoutlmLayoutLMModel)
layoutlmv2LayoutLMv2Model)
layoutlmv3LayoutLMv3Model)ledLEDModellevit
LevitModel)lfm2	Lfm2Model	lightglueLightGlueForKeypointMatching)lilt	LiltModel)llamar|   llama4Llama4ForConditionalGeneration)llama4_textLlama4TextModel)llava
LlavaModel)
llava_nextLlavaNextModel)llava_next_videoLlavaNextVideoModel)llava_onevisionLlavaOnevisionModel
longformerLongformerModel)longt5LongT5Model)luke	LukeModel)lxmertLxmertModel)m2m_100M2M100Model)mamba
MambaModel)mamba2Mamba2Model)marianMarianModel)markuplmMarkupLMModel)mask2formerMask2FormerModel)
maskformerMaskFormerModel)maskformer-swinMaskFormerSwinModel)mbart
MBartModel)mctct
MCTCTModel)mega	MegaModel)megatron-bertMegatronBertModel)zmgp-strMgpstrForSceneTextRecognition)mimi	MimiModel)minimaxMiniMaxModel)mistralMistralModel)mistral3Mistral3Model)mixtralMixtralModelmlcdMLCDVisionModel)mllamaMllamaModel)mm-grounding-dinoMMGroundingDinoModel
mobilebertMobileBertModelmobilenet_v1MobileNetV1Modelmobilenet_v2MobileNetV2Model	mobilevitMobileViTModelmobilevitv2MobileViTV2Model)
modernbertModernBertModel)modernbert-decoderModernBertDecoderModel)	moonshineMoonshineModel)moshi
MoshiModel)mpnet
MPNetModel)mptMptModel)mraMraModel)mt5MT5Model)musicgenMusicgenModel)musicgen_melodyMusicgenMelodyModel)mvpMvpModelnatNatModel)nemotronNemotronModel)nezha
NezhaModel)nllb-moeNllbMoeModelnystromformerNystromformerModel)olmo	OlmoModel)olmo2
Olmo2Model)olmoe
OlmoeModelzomdet-turboOmDetTurboForObjectDetection)	oneformerOneFormerModel)
open-llamaOpenLlamaModel)
openai-gptOpenAIGPTModel)optOPTModel)owlv2
Owlv2Model)owlvitOwlViTModel)	paligemmaPaliGemmaModel)patchtsmixerPatchTSMixerModel)patchtstPatchTSTModel)pegasusPegasusModel)	pegasus_xPegasusXModel)	perceiverPerceiverModel)perception_encoderPerceptionEncoder)perception_lmPerceptionLMModel)	persimmonPersimmonModel)phiPhiModel)phi3	Phi3Model)phi4_multimodalPhi4MultimodalModel)phimoePhimoeModel)pixtralPixtralVisionModel)plbartPLBartModel
poolformerPoolFormerModel)
prophetnetProphetNetModelpvtPvtModel)pvt_v2
PvtV2Model)qdqbertQDQBertModel)qwen2
Qwen2Model)
qwen2_5_vlQwen2_5_VLModel)qwen2_5_vl_textQwen2_5_VLTextModel)qwen2_audio_encoderQwen2AudioEncoder)	qwen2_moeQwen2MoeModel)qwen2_vlQwen2VLModel)qwen2_vl_textQwen2VLTextModel)qwen3
Qwen3Model)	qwen3_moeQwen3MoeModel)recurrent_gemmaRecurrentGemmaModelreformerReformerModelregnetRegNetModelrembertRemBertModelresnetResNetModel	retribertRetriBertModelrobertaRobertaModelroberta-prelayernormRobertaPreLayerNormModelroc_bertRoCBertModelroformerRoFormerModel)rt_detrRTDetrModel)
rt_detr_v2RTDetrV2Model)rwkv	RwkvModelsamSamModelsam_hq
SamHQModel)sam_hq_vision_modelSamHQVisionModel)sam_vision_modelSamVisionModel)seamless_m4tSeamlessM4TModel)seamless_m4t_v2SeamlessM4Tv2Model	segformerSegformerModel)seggptSegGptModel)sewSEWModel)sew-d	SEWDModelsiglipSiglipModelsiglip2Siglip2Modelsiglip_vision_modelSiglipVisionModel)smollm3SmolLM3Model)smolvlmSmolVLMModel)smolvlm_visionSmolVLMVisionTransformer)speech_to_textSpeech2TextModel)speecht5SpeechT5Model)splinterSplinterModelsqueezebertSqueezeBertModel)stablelmStableLmModel)
starcoder2Starcoder2ModelswiftformerSwiftFormerModelswin	SwinModelswin2srSwin2SRModelswinv2Swinv2Model)switch_transformersSwitchTransformersModel)t5T5Model)t5gemmaT5GemmaModeltable-transformerTableTransformerModel)tapas
TapasModel)textnetTextNetModel)time_series_transformerTimeSeriesTransformerModel)timesfmTimesFmModeltimesformerTimesformerModeltimm_backboneTimmBackbonetimm_wrapperr/  )trajectory_transformerTrajectoryTransformerModel)
transfo-xlTransfoXLModel)tvlt	TvltModel)tvpTvpModel)udop	UdopModel)umt5	UMT5Model)	unispeechUniSpeechModel)unispeech-satUniSpeechSatModel)univnetUnivNetModelvanVanModel)video_llavaVideoLlavaModelvideomaeVideoMAEModel)vilt	ViltModel)vipllavaVipLlavaModel)zvision-text-dual-encoderVisionTextDualEncoderModel)visual_bertVisualBertModelvitViTModel
vit_hybridViTHybridModelvit_maeViTMAEModelvit_msnViTMSNModelvitdetVitDetModelvits	VitsModelvivit
VivitModel)vjepa2VJEPA2ModelvoxtralVoxtralForConditionalGeneration)voxtral_encoderVoxtralEncoder)wav2vec2Wav2Vec2Model)wav2vec2-bertWav2Vec2BertModel)wav2vec2-conformerWav2Vec2ConformerModel)wavlm
WavLMModel)whisperWhisperModel)xclip
XCLIPModel)xglm	XGLMModelxlmXLMModel)xlm-prophetnetXLMProphetNetModelxlm-robertaXLMRobertaModelxlm-roberta-xlXLMRobertaXLModel)xlnet
XLNetModel)xlstm
xLSTMModel)xmod	XmodModelyolos
YolosModel)yoso	YosoModel)zamba
ZambaModel)zamba2Zamba2Model)W)r!   AlbertForPreTrainingr:   BartForConditionalGeneration)r@   BertForPreTraining)rE   BigBirdForPreTrainingr[   BloomForCausalLMra   CamembertForMaskedLMcolpaliColPaliForRetrieval)colqwen2ColQwen2ForRetrievalr   CTRLLMHeadModelr   Data2VecTextForMaskedLMr   DebertaForMaskedLMr   DebertaV2ForMaskedLMr   DistilBertForMaskedLM)r   ElectraForPreTraining)r   ErnieForPreTrainingr   EvollaForProteinText2Textr  Exaone4ForCausalLMr  FalconMambaForCausalLMr  FlaubertWithLMHeadModel)r  FlavaForPreTraining)r  FNetForPreTrainingr  FSMTForConditionalGeneration)r  FunnelForPreTrainingr$  Gemma3ForConditionalGenerationrA  GPT2LMHeadModelrC  ro  rD  GPTBigCodeForCausalLMrP  )rf  HieraForPreTrainingrk  IBertForMaskedLMrm  IdeficsForVisionText2Textro   Idefics2ForConditionalGenerationrq   Idefics3ForConditionalGenerationr  JanusForConditionalGenerationr  LayoutLMForMaskedLMr  LlavaForConditionalGenerationr  !LlavaNextForConditionalGenerationr  &LlavaNextVideoForConditionalGenerationr  &LlavaOnevisionForConditionalGenerationr  LongformerForMaskedLMr  LukeForMaskedLM)r  LxmertForPreTrainingr  MambaForCausalLMr  Mamba2ForCausalLMr  MegaForMaskedLM)r  MegatronBertForPreTrainingr   Mistral3ForConditionalGenerationr  MllamaForConditionalGeneration)r  MobileBertForPreTrainingr  MPNetForMaskedLMr  MptForCausalLMr  MraForMaskedLMr  MvpForConditionalGeneration)r  NezhaForPreTrainingr  NllbMoeForConditionalGenerationr!  OpenAIGPTLMHeadModelr)  !PaliGemmaForConditionalGenerationqwen2_audio"Qwen2AudioForConditionalGenerationrs  rw  RobertaForMaskedLMrz  RobertaPreLayerNormForMaskedLM)r}  RoCBertForPreTrainingr  RwkvForCausalLM)r  SplinterForPreTrainingr  SqueezeBertForMaskedLMr  *SwitchTransformersForConditionalGenerationr  T5ForConditionalGenerationr  T5GemmaForConditionalGenerationr  TapasForMaskedLMr  TransfoXLLMHeadModel)r  TvltForPreTraining)r  UniSpeechForPreTraining)r  UniSpeechSatForPreTrainingr  "VideoLlavaForConditionalGeneration)r  VideoMAEForPreTrainingr   VipLlavaForConditionalGeneration)r  VisualBertForPreTraining)r  ViTMAEForPreTrainingr  )r  Wav2Vec2ForPreTraining)r!  Wav2Vec2ConformerForPreTrainingr,  XLMWithLMHeadModelr1  XLMRobertaForMaskedLMr4  XLMRobertaXLForMaskedLMr6  XLNetLMHeadModelr8  xLSTMForCausalLMr:  XmodForMaskedLM)Tr!   AlbertForMaskedLMrF  r@   BertForMaskedLMrE   BigBirdForMaskedLMrG   &BigBirdPegasusForConditionalGenerationrR   'BlenderbotSmallForConditionalGenerationrJ  rL  r}   CodeGenForCausalLMr   ConvBertForMaskedLMr   CpmAntForCausalLMrS  rU  rW  rY  r   DiaForConditionalGenerationr[  r   ElectraForMaskedLMzencoder-decoderEncoderDecoderModelr   ErnieForMaskedLMr   EsmForMaskedLMra  rc  re  r  FNetForMaskedLMri  r  FunnelForMaskedLMr0  GitForCausalLMrn  rp  rq  rF  GPTNeoForCausalLMrH  GPTNeoXForCausalLMrJ  GPTNeoXJapaneseForCausalLMrN  GPTJForCausalLMrP  rt  r~  r  LEDForConditionalGenerationr  r  LongT5ForConditionalGenerationr  r  M2M100ForConditionalGenerationr  r  r  MarianMTModelr  r  MegatronBertForCausalLMr  MobileBertForMaskedLMr  !MoonshineForConditionalGenerationr  r  r  r  r  NezhaForMaskedLMr  r  NystromformerForMaskedLMr  r1   PegasusXForConditionalGenerationrE  PLBartForConditionalGeneration	pop2piano!Pop2PianoForConditionalGenerationrQ  QDQBertForMaskedLMrh  ReformerModelWithLMHeadrn  RemBertForMaskedLMr  r  r}  RoCBertForMaskedLMr  RoFormerForMaskedLMr  r  #Speech2TextForConditionalGenerationr  r  r  r  r  r  r  Wav2Vec2ForMaskedLMr%  WhisperForConditionalGenerationr  r  r  r  r  r?  YosoForMaskedLM))r)   ArceeForCausalLM)r-   AriaTextForCausalLM)r5   BambaForCausalLM)r:   BartForCausalLM)r@   BertLMHeadModel)rB   BertGenerationDecoder)rE   BigBirdForCausalLM)rG   BigBirdPegasusForCausalLM)rI   BioGptForCausalLM)rN   BitNetForCausalLM)rP   BlenderbotForCausalLM)rR   BlenderbotSmallForCausalLMrJ  )ra   CamembertForCausalLM)r{   LlamaForCausalLMr  )r   CohereForCausalLM)r   Cohere2ForCausalLMr  rS  )r   Data2VecTextForCausalLM)r   DbrxForCausalLM)r   DeepseekV2ForCausalLM)r   DeepseekV3ForCausalLM)r   DiffLlamaForCausalLM)r   DogeForCausalLM)r   Dots1ForCausalLM)r   ElectraForCausalLM)r   Emu3ForCausalLM)r   ErnieForCausalLM)r   Ernie4_5ForCausalLM)r   Ernie4_5_MoeForCausalLMra  )r  FalconForCausalLM)r  FalconH1ForCausalLMrc  r  FuyuForCausalLM)r   GemmaForCausalLM)r"  Gemma2ForCausalLMrl  )r&  Gemma3ForCausalLMr(  Gemma3nForConditionalGeneration)r,  Gemma3nForCausalLMr  )r2  GlmForCausalLM)r4  Glm4ForCausalLM)r6  Glm4MoeForCausalLMr?  GotOcr2ForConditionalGenerationrn  rp  rq  r  r  r  )rL  GptOssForCausalLMr  )rR  GraniteForCausalLM)rT  GraniteMoeForCausalLM)rV  GraniteMoeHybridForCausalLM)rX  GraniteMoeSharedForCausalLM)r`  HeliumForCausalLM)r  JambaForCausalLM)r  JetMoeForCausalLM)r  Lfm2ForCausalLM)r  r7  )r  Llama4ForCausalLM)r  r^  r  r  )r  MarianForCausalLM)r  MBartForCausalLM)r  MegaForCausalLMr  )r  MiniMaxForCausalLM)r  MistralForCausalLM)r  MixtralForCausalLM)r  MllamaForCausalLM)r  ModernBertDecoderForCausalLM)r  MoshiForCausalLMr  )r  MusicgenForCausalLM)r  MusicgenMelodyForCausalLM)r  MvpForCausalLM)r  NemotronForCausalLM)r  OlmoForCausalLM)r  Olmo2ForCausalLM)r  OlmoeForCausalLM)r  OpenLlamaForCausalLMr  )r#  OPTForCausalLM)r/  PegasusForCausalLM)r9  PersimmonForCausalLM)r;  PhiForCausalLM)r=  Phi3ForCausalLM)r?  Phi4MultimodalForCausalLM)rA  PhimoeForCausalLM)rE  PLBartForCausalLM)rJ  ProphetNetForCausalLM)rQ  QDQBertLMHeadModel)rS  Qwen2ForCausalLM)r[  Qwen2MoeForCausalLM)ra  Qwen3ForCausalLM)rc  Qwen3MoeForCausalLM)re  RecurrentGemmaForCausalLMr  )rn  RemBertForCausalLM)rw  RobertaForCausalLM)rz  RobertaPreLayerNormForCausalLM)r}  RoCBertForCausalLM)r  RoFormerForCausalLMr  )r  SmolLM3ForCausalLM)speech_to_text_2Speech2Text2ForCausalLM)r  StableLmForCausalLM)r  Starcoder2ForCausalLMr  )trocrTrOCRForCausalLM)r%  WhisperForCausalLM)r)  XGLMForCausalLMr  )r.  XLMProphetNetForCausalLM)r1  XLMRobertaForCausalLM)r4  XLMRobertaXLForCausalLMr  r  )r:  XmodForCausalLM)rA  ZambaForCausalLM)rC  Zamba2ForCausalLM)9r   r<   rK   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r  r<  re  ru  rx  r  )r  Llama4VisionModelr  )r  MllamaVisionModelr  r  r  r  r	  rG  rL  rj  rp  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r
  r  r  r<  ))r   DeiTForMaskedImageModeling)r  FocalNetForMaskedImageModeling)r  SwinForMaskedImageModeling)r  Swinv2ForMaskedImageModeling)r  ViTForMaskedImageModeling)ry  ImageGPTForCausalImageModeling),)r=   BeitForImageClassification)rL   BitForImageClassification)ro   CLIPForImageClassification)r   ConvNextForImageClassification)r    ConvNextV2ForImageClassification)r   CvtForImageClassification)r   $Data2VecVisionForImageClassification)r   )DeiTForImageClassification%DeiTForImageClassificationWithTeacher)r   DinatForImageClassification)r   Dinov2ForImageClassification)r   )Dinov2WithRegistersForImageClassification)r   DonutSwinForImageClassification)r   )%EfficientFormerForImageClassification0EfficientFormerForImageClassificationWithTeacher)r   "EfficientNetForImageClassification)r  FocalNetForImageClassification)rc  HGNetV2ForImageClassification)rf  HieraForImageClassification)rv  IJepaForImageClassification)ry  ImageGPTForImageClassification)r  )LevitForImageClassification&LevitForImageClassificationWithTeacher)r  !MobileNetV1ForImageClassification)r  !MobileNetV2ForImageClassification)r  MobileViTForImageClassification)r  !MobileViTV2ForImageClassification)r
  NatForImageClassification)r3  )&PerceiverForImageClassificationLearned&PerceiverForImageClassificationFourier-PerceiverForImageClassificationConvProcessing)rH   PoolFormerForImageClassification)rM  PvtForImageClassification)rO  PvtV2ForImageClassification)rk  RegNetForImageClassification)rq  ResNetForImageClassification)r  SegformerForImageClassification)shieldgemma2"ShieldGemma2ForImageClassification)r  SiglipForImageClassification)r  Siglip2ForImageClassification)r  !SwiftFormerForImageClassification)r  SwinForImageClassification)r  Swinv2ForImageClassification)r  TextNetForImageClassification)r  !TimmWrapperForImageClassification)r  VanForImageClassification)r  ViTForImageClassification)r  ViTHybridForImageClassification)r  ViTMSNForImageClassificationr   DetrForSegmentation))r=   BeitForSemanticSegmentation)r   %Data2VecVisionForSemanticSegmentation)r   DPTForSemanticSegmentation)r  "MobileNetV2ForSemanticSegmentation)r   MobileViTForSemanticSegmentation)r  "MobileViTV2ForSemanticSegmentation)r   SegformerForSemanticSegmentation)upernetUperNetForSemanticSegmentationr  !MaskFormerForInstanceSegmentation)r  )eomtEomtForUniversalSegmentation)r  #Mask2FormerForUniversalSegmentationr  )r  !OneFormerForUniversalSegmentation))r  !TimesformerForVideoClassification)r  VideoMAEForVideoClassification)r  VivitForVideoClassification)r  VJEPA2ForVideoClassification)rU   BlipForConditionalGenerationrW   Blip2ForConditionalGenerationre   !ChameleonForConditionalGenerationr  rx  rz  r}  $InstructBlipForConditionalGeneration)r  )InstructBlipVideoForConditionalGenerationr  Kosmos2ForConditionalGenerationr  r  r  r  r  r  r  
pix2struct"Pix2StructForConditionalGenerationrU  "Qwen2_5_VLForConditionalGenerationr]  Qwen2VLForConditionalGenerationr  r  zvision-encoder-decoderVisionEncoderDecoderModelrN  )))r+   AriaForConditionalGeneration)r3   !AyaVisionForConditionalGenerationr  r  r  )r   %Cohere2VisionForConditionalGeneration)r   "DeepseekVLForConditionalGeneration)r   (DeepseekVLHybridForConditionalGeneration)r   Emu3ForConditionalGenerationr_  rH  rl  rM  r  )r8  Glm4vForConditionalGenerationrS  rv  rx  rz  r  )r   InternVLForConditionalGenerationr|  r  r  r  r  r  r  r  r  r  )r7  $PerceptionLMForConditionalGenerationr  )rC  r  r  r  )r  rm  )r  SmolVLMForConditionalGeneration)r  UdopForConditionalGenerationr  r  ).r  rF  r  r  rL  r  rU  rW  rY  r[  r  r  r  re  r  r  rt  r~  r  r  r  MBartForConditionalGenerationr  )r  MegatronBertForMaskedLMr	  )r  ModernBertForMaskedLMr  r  r  r  r  )r3  PerceiverForMaskedLMr  )rh  ReformerForMaskedLMr  r  r  r  r   r  r  r$  r  r  r  r  r(  )
)r   !ConditionalDetrForObjectDetection)r   DFineForObjectDetection)r   DabDetrForObjectDetection)r    DeformableDetrForObjectDetection)r   DetaForObjectDetection)r   DetrForObjectDetection)r  RTDetrForObjectDetection)r  RTDetrV2ForObjectDetection)r  "TableTransformerForObjectDetection)r=  YolosForObjectDetection))r\  GroundingDinoForObjectDetection)r  !MMGroundingDinoForObjectDetectionr  )r%  Owlv2ForObjectDetection)r'  OwlViTForObjectDetection))depth_anythingDepthAnythingForDepthEstimation)r   DepthProForDepthEstimation)r   DPTForDepthEstimation)r=  GLPNForDepthEstimation)prompt_depth_anything%PromptDepthAnythingForDepthEstimation)zoedepthZoeDepthForDepthEstimation)rF  r  )rP   "BlenderbotForConditionalGenerationr  r  ri  rP  granite_speech%GraniteSpeechForConditionalGenerationr  r  r  r  r  )r  MT5ForConditionalGenerationr  r  )r/  PegasusForConditionalGenerationr  r  )rJ  "ProphetNetForConditionalGenerationr  )r  SeamlessM4TForTextToText)r  SeamlessM4Tv2ForTextToTextr  r  r  )r  UMT5ForConditionalGenerationr  )r.  %XLMProphetNetForConditionalGeneration)r  r  )r  *KyutaiSpeechToTextForConditionalGenerationr  r  )r  SeamlessM4TForSpeechToText)r  SeamlessM4Tv2ForSpeechToText)zspeech-encoder-decoderSpeechEncoderDecoderModelr"  )r  SpeechT5ForSpeechToTextr&  )k)r!   AlbertForSequenceClassification)r)   ArceeForSequenceClassification)r:   BartForSequenceClassification)r@   BertForSequenceClassification)rE    BigBirdForSequenceClassification)rG   'BigBirdPegasusForSequenceClassification)rI   BioGptForSequenceClassification)r[   BloomForSequenceClassification)ra   "CamembertForSequenceClassification)rc   CanineForSequenceClassification)r{   LlamaForSequenceClassification)r   !ConvBertForSequenceClassification)r   CTRLForSequenceClassification)r   %Data2VecTextForSequenceClassification)r    DebertaForSequenceClassification)r   "DebertaV2ForSequenceClassification)r   #DeepseekV2ForSequenceClassification)r   "DiffLlamaForSequenceClassification)r   #DistilBertForSequenceClassification)r   DogeForSequenceClassification)r    ElectraForSequenceClassification)r   ErnieForSequenceClassification)r   ErnieMForSequenceClassification)r   EsmForSequenceClassification)r   Exaone4ForSequenceClassification)r  FalconForSequenceClassification)r  !FlaubertForSequenceClassification)r  FNetForSequenceClassification)r  FunnelForSequenceClassification)r   GemmaForSequenceClassification)r"  Gemma2ForSequenceClassification)r$  Gemma3ForSequenceClassification)r2  GlmForSequenceClassification)r4  Glm4ForSequenceClassification)rA  GPT2ForSequenceClassification)rC  rP  )rD  #GPTBigCodeForSequenceClassification)rF  GPTNeoForSequenceClassification)rH   GPTNeoXForSequenceClassification)rN  GPTJForSequenceClassification)r`  HeliumForSequenceClassification)rk  IBertForSequenceClassification)r  JambaForSequenceClassification)r  JetMoeForSequenceClassification)r  !LayoutLMForSequenceClassification)r  #LayoutLMv2ForSequenceClassification)r  #LayoutLMv3ForSequenceClassification)r  LEDForSequenceClassification)r  LiltForSequenceClassification)r  r8  )r  #LongformerForSequenceClassification)r  LukeForSequenceClassification)r  !MarkupLMForSequenceClassification)r  MBartForSequenceClassification)r  MegaForSequenceClassification)r  %MegatronBertForSequenceClassification)r   MiniMaxForSequenceClassification)r   MistralForSequenceClassification)r   MixtralForSequenceClassification)r  #MobileBertForSequenceClassification)r  #ModernBertForSequenceClassification)r  *ModernBertDecoderForSequenceClassification)r  MPNetForSequenceClassification)r  MptForSequenceClassification)r  MraForSequenceClassification)r  MT5ForSequenceClassification)r  MvpForSequenceClassification)r  !NemotronForSequenceClassification)r  NezhaForSequenceClassification)r  &NystromformerForSequenceClassification)r  "OpenLlamaForSequenceClassification)r!  "OpenAIGPTForSequenceClassification)r#  OPTForSequenceClassification)r3  "PerceiverForSequenceClassification)r9  "PersimmonForSequenceClassification)r;  PhiForSequenceClassification)r=  Phi3ForSequenceClassification)rA  PhimoeForSequenceClassification)rE  PLBartForSequenceClassification)rQ   QDQBertForSequenceClassification)rS  Qwen2ForSequenceClassification)r[  !Qwen2MoeForSequenceClassification)ra  Qwen3ForSequenceClassification)rc  !Qwen3MoeForSequenceClassification)rh  !ReformerForSequenceClassification)rn   RemBertForSequenceClassification)rw   RobertaForSequenceClassification)rz  ,RobertaPreLayerNormForSequenceClassification)r}   RoCBertForSequenceClassification)r  !RoFormerForSequenceClassification)r   SmolLM3ForSequenceClassification)r  $SqueezeBertForSequenceClassification)r  !StableLmForSequenceClassification)r  #Starcoder2ForSequenceClassification)r  T5ForSequenceClassification)r   T5GemmaForSequenceClassification)r  TapasForSequenceClassification)r  "TransfoXLForSequenceClassification)r  UMT5ForSequenceClassification)r,  XLMForSequenceClassification)r1  #XLMRobertaForSequenceClassification)r4  %XLMRobertaXLForSequenceClassification)r6  XLNetForSequenceClassification)r:  XmodForSequenceClassification)r?  YosoForSequenceClassification)rA  ZambaForSequenceClassification)rC  Zamba2ForSequenceClassification)L)r!   AlbertForQuestionAnswering)r)   ArceeForQuestionAnswering)r:   BartForQuestionAnswering)r@   BertForQuestionAnswering)rE   BigBirdForQuestionAnswering)rG   "BigBirdPegasusForQuestionAnswering)r[   BloomForQuestionAnswering)ra   CamembertForQuestionAnswering)rc   CanineForQuestionAnswering)r   ConvBertForQuestionAnswering)r    Data2VecTextForQuestionAnswering)r   DebertaForQuestionAnswering)r   DebertaV2ForQuestionAnswering)r   DiffLlamaForQuestionAnswering)r   DistilBertForQuestionAnswering)r   ElectraForQuestionAnswering)r   ErnieForQuestionAnswering)r   ErnieMForQuestionAnswering)r  Exaone4ForQuestionAnswering)r  FalconForQuestionAnswering)r  "FlaubertForQuestionAnsweringSimple)r  FNetForQuestionAnswering)r  FunnelForQuestionAnswering)rC  GPT2ForQuestionAnswering)rF  GPTNeoForQuestionAnswering)rH  GPTNeoXForQuestionAnswering)rN  GPTJForQuestionAnswering)rk  IBertForQuestionAnsweringr  LayoutLMv2ForQuestionAnsweringr  LayoutLMv3ForQuestionAnswering)r  LEDForQuestionAnswering)r  LiltForQuestionAnswering)r  LlamaForQuestionAnswering)r  LongformerForQuestionAnswering)r  LukeForQuestionAnswering)r  LxmertForQuestionAnswering)r  MarkupLMForQuestionAnswering)r  MBartForQuestionAnswering)r  MegaForQuestionAnswering)r   MegatronBertForQuestionAnswering)r  MiniMaxForQuestionAnswering)r  MistralForQuestionAnswering)r  MixtralForQuestionAnswering)r  MobileBertForQuestionAnswering)r  ModernBertForQuestionAnswering)r  MPNetForQuestionAnswering)r  MptForQuestionAnswering)r  MraForQuestionAnswering)r  MT5ForQuestionAnswering)r  MvpForQuestionAnswering)r  NemotronForQuestionAnswering)r  NezhaForQuestionAnswering)r  !NystromformerForQuestionAnswering)r#  OPTForQuestionAnswering)rQ  QDQBertForQuestionAnswering)rS  Qwen2ForQuestionAnswering)r[  Qwen2MoeForQuestionAnswering)ra  Qwen3ForQuestionAnswering)rc  Qwen3MoeForQuestionAnswering)rh  ReformerForQuestionAnswering)rn  RemBertForQuestionAnswering)rw  RobertaForQuestionAnswering)rz  'RobertaPreLayerNormForQuestionAnswering)r}  RoCBertForQuestionAnswering)r  RoFormerForQuestionAnswering)r  SmolLM3ForQuestionAnswering)r  SplinterForQuestionAnswering)r  SqueezeBertForQuestionAnswering)r  T5ForQuestionAnswering)r  UMT5ForQuestionAnswering)r,  XLMForQuestionAnsweringSimple)r1  XLMRobertaForQuestionAnswering)r4   XLMRobertaXLForQuestionAnswering)r6  XLNetForQuestionAnsweringSimple)r:  XmodForQuestionAnswering)r?  YosoForQuestionAnswering)r  TapasForQuestionAnswering))rU   BlipForQuestionAnsweringr  )r  ViltForQuestionAnswering))r  LayoutLMForQuestionAnsweringr  r  )S)r!   AlbertForTokenClassification)r)   ArceeForTokenClassification)r@   BertForTokenClassification)rE   BigBirdForTokenClassification)rI   BioGptForTokenClassification)r[   BloomForTokenClassification)r_   BrosForTokenClassification)ra   CamembertForTokenClassification)rc   CanineForTokenClassification)r   ConvBertForTokenClassification)r   "Data2VecTextForTokenClassification)r   DebertaForTokenClassification)r   DebertaV2ForTokenClassification)r   DiffLlamaForTokenClassification)r    DistilBertForTokenClassification)r   ElectraForTokenClassification)r   ErnieForTokenClassification)r   ErnieMForTokenClassification)r   EsmForTokenClassification)r  Exaone4ForTokenClassification)r  FalconForTokenClassification)r  FlaubertForTokenClassification)r  FNetForTokenClassification)r  FunnelForTokenClassification)r   GemmaForTokenClassification)r"  Gemma2ForTokenClassification)r2  GlmForTokenClassification)r4  Glm4ForTokenClassification)rA  GPT2ForTokenClassification)rC  r  )rD   GPTBigCodeForTokenClassification)rF  GPTNeoForTokenClassification)rH  GPTNeoXForTokenClassification)r`  HeliumForTokenClassification)rk  IBertForTokenClassification)r  LayoutLMForTokenClassification)r   LayoutLMv2ForTokenClassification)r   LayoutLMv3ForTokenClassification)r  LiltForTokenClassification)r  LlamaForTokenClassification)r   LongformerForTokenClassification)r  LukeForTokenClassification)r  MarkupLMForTokenClassification)r  MegaForTokenClassification)r  "MegatronBertForTokenClassification)r  MiniMaxForTokenClassification)r  MistralForTokenClassification)r  MixtralForTokenClassification)r   MobileBertForTokenClassification)r   ModernBertForTokenClassification)r  MPNetForTokenClassification)r  MptForTokenClassification)r  MraForTokenClassification)r  MT5ForTokenClassification)r  NemotronForTokenClassification)r  NezhaForTokenClassification)r  #NystromformerForTokenClassification)r9  PersimmonForTokenClassification)r;  PhiForTokenClassification)r=  Phi3ForTokenClassification)rQ  QDQBertForTokenClassification)rS  Qwen2ForTokenClassification)r[  Qwen2MoeForTokenClassification)ra  Qwen3ForTokenClassification)rc  Qwen3MoeForTokenClassification)rn  RemBertForTokenClassification)rw  RobertaForTokenClassification)rz  )RobertaPreLayerNormForTokenClassification)r}  RoCBertForTokenClassification)r  RoFormerForTokenClassification)r  SmolLM3ForTokenClassification)r  !SqueezeBertForTokenClassification)r  StableLmForTokenClassification)r   Starcoder2ForTokenClassification)r  T5ForTokenClassification)r  T5GemmaForTokenClassification)r  UMT5ForTokenClassification)r,  XLMForTokenClassification)r1   XLMRobertaForTokenClassification)r4  "XLMRobertaXLForTokenClassification)r6  XLNetForTokenClassification)r:  XmodForTokenClassification)r?  YosoForTokenClassification)')r!   AlbertForMultipleChoice)r@   BertForMultipleChoice)rE   BigBirdForMultipleChoice)ra   CamembertForMultipleChoice)rc   CanineForMultipleChoice)r   ConvBertForMultipleChoice)r   Data2VecTextForMultipleChoice)r   DebertaV2ForMultipleChoice)r   DistilBertForMultipleChoice)r   ElectraForMultipleChoice)r   ErnieForMultipleChoice)r   ErnieMForMultipleChoice)r  FlaubertForMultipleChoice)r  FNetForMultipleChoice)r  FunnelForMultipleChoice)rk  IBertForMultipleChoice)r  LongformerForMultipleChoice)r  LukeForMultipleChoice)r  MegaForMultipleChoice)r  MegatronBertForMultipleChoice)r  MobileBertForMultipleChoice)r  ModernBertForMultipleChoice)r  MPNetForMultipleChoice)r  MraForMultipleChoice)r  NezhaForMultipleChoice)r  NystromformerForMultipleChoice)rQ  QDQBertForMultipleChoice)rn  RemBertForMultipleChoice)rw  RobertaForMultipleChoice)rz  $RobertaPreLayerNormForMultipleChoice)r}  RoCBertForMultipleChoice)r  RoFormerForMultipleChoice)r  SqueezeBertForMultipleChoice)r,  XLMForMultipleChoice)r1  XLMRobertaForMultipleChoice)r4  XLMRobertaXLForMultipleChoice)r6  XLNetForMultipleChoice)r:  XmodForMultipleChoice)r?  YosoForMultipleChoice))r@   BertForNextSentencePrediction)r   ErnieForNextSentencePrediction)r  FNetForNextSentencePrediction)r  %MegatronBertForNextSentencePrediction)r  #MobileBertForNextSentencePrediction)r  NezhaForNextSentencePrediction)rQ   QDQBertForNextSentencePrediction))r/   ASTForAudioClassification)r   &Data2VecAudioForSequenceClassification)rh  HubertForSequenceClassification)r  SEWForSequenceClassification)r  SEWDForSequenceClassification)r  "UniSpeechForSequenceClassification)r  %UniSpeechSatForSequenceClassification)r  !Wav2Vec2ForSequenceClassification)r  %Wav2Vec2BertForSequenceClassification)r!  *Wav2Vec2ConformerForSequenceClassification)r#  WavLMForSequenceClassification)r%  WhisperForAudioClassification))r   Data2VecAudioForCTC)rh  HubertForCTC)r  MCTCTForCTC)r  	SEWForCTC)r  
SEWDForCTC)r  UniSpeechForCTC)r  UniSpeechSatForCTC)r  Wav2Vec2ForCTC)r  Wav2Vec2BertForCTC)r!  Wav2Vec2ConformerForCTC)r#  WavLMForCTC))r   (Data2VecAudioForAudioFrameClassification)r  'UniSpeechSatForAudioFrameClassification)r  #Wav2Vec2ForAudioFrameClassification)r  'Wav2Vec2BertForAudioFrameClassification)r!  ,Wav2Vec2ConformerForAudioFrameClassification)r#   WavLMForAudioFrameClassification))r   Data2VecAudioForXVector)r  UniSpeechSatForXVector)r  Wav2Vec2ForXVector)r  Wav2Vec2BertForXVector)r!  Wav2Vec2ConformerForXVector)r#  WavLMForXVectorr	  )r  SpeechT5ForTextToSpeech)
r7   r   )r
  r  r  )r   MusicgenForConditionalGeneration)r  &MusicgenMelodyForConditionalGeneration)qwen2_5_omni#Qwen2_5OmniForConditionalGeneration)r  SeamlessM4TForTextToSpeech)r  SeamlessM4Tv2ForTextToSpeechr  )	r#   r&   rT   )rW   Blip2ForImageTextRetrievalrg   rn   rv   r  r  ))r=   BeitBackbone)rL   BitBackbone)r   ConvNextBackbone)r   ConvNextV2Backbone)r   DinatBackbone)r   Dinov2Backbone)r   Dinov2WithRegistersBackbone)r  FocalNetBackbonerb  )rf  HieraBackbone)r  MaskFormerSwinBackbone)r
  NatBackbone)rO  PvtV2Backbone)rq  ResNetBackbone)rt_detr_resnetRTDetrResNetBackbone)r  SwinBackbone)r  Swinv2Backbone)r  TextNetBackboner  )r  VitDetBackbone)vitpose_backboneVitPoseBackboner  r  )
superpointSuperPointForKeypointDetection))r   !EfficientLoFTRForKeypointMatchingr  )	superglueSuperGlueForKeypointMatching)r    r?   rD   rq   r   r   r   r   r   )r   Emu3TextModelr  rj  )r  r  r  )r  MllamaTextModelr  )r  MT5EncoderModelr  rg  rm  rv  ry  r|  r  r  )r  T5EncoderModel)r  T5GemmaEncoderModel)r  UMT5EncoderModelr+  r0  r3  )r+  'PatchTSMixerForTimeSeriesClassification)r-  PatchTSTForClassification)r+  PatchTSMixerForRegression)r-  PatchTSTForRegression)r  TimesFmModelForPrediction)r  Swin2SRForImageSuperResolutionr   c                       \ rS rSr\rSrg)AutoModelForMaskGenerationi+  r   N)r   r   r   r   !MODEL_FOR_MASK_GENERATION_MAPPING_model_mappingr   r   r   r   r  r  +      6Nr   r  c                       \ rS rSr\rSrg)AutoModelForKeypointDetectioni/  r   N)r   r   r   r   $MODEL_FOR_KEYPOINT_DETECTION_MAPPINGr  r   r   r   r   r  r  /      9Nr   r  c                       \ rS rSr\rSrg)AutoModelForKeypointMatchingi3  r   N)r   r   r   r   #MODEL_FOR_KEYPOINT_MATCHING_MAPPINGr  r   r   r   r   r  r  3  s    8Nr   r  c                       \ rS rSr\rSrg)AutoModelForTextEncodingi7  r   N)r   r   r   r   MODEL_FOR_TEXT_ENCODING_MAPPINGr  r   r   r   r   r  r  7      4Nr   r  c                       \ rS rSr\rSrg)AutoModelForImageToImagei;  r   N)r   r   r   r    MODEL_FOR_IMAGE_TO_IMAGE_MAPPINGr  r   r   r   r   r  r  ;  s    5Nr   r  c                       \ rS rSr\rSrg)	AutoModeli?  r   N)r   r   r   r   MODEL_MAPPINGr  r   r   r   r   r  r  ?  s    "Nr   r  c                       \ rS rSr\rSrg)AutoModelForPreTrainingiF  r   N)r   r   r   r   MODEL_FOR_PRETRAINING_MAPPINGr  r   r   r   r   r  r  F  s    2Nr   r  pretraining)head_docc                       \ rS rSr\rSrg)_AutoModelWithLMHeadiN  r   N)r   r   r   r   MODEL_WITH_LM_HEAD_MAPPINGr  r   r   r   r   r  r  N      /Nr   r  zlanguage modelingc                   p   ^  \ rS rSr\r\S\S    S\\	\
R                  \	   4   SS4U 4S jj5       rSrU =r$ )AutoModelForCausalLMiU  clspretrained_model_name_or_pathreturnr   c                 ,   > [         TU ]  " U/UQ70 UD6$ Nsuperfrom_pretrainedr  r  
model_argskwargs	__class__s       r   r  $AutoModelForCausalLM.from_pretrainedY  !     w&'D\z\U[\\r   r   )r   r   r   r   MODEL_FOR_CAUSAL_LM_MAPPINGr  classmethodtyper   strosPathLiker  r   __classcell__r  s   @r   r  r  U  sT    0N ]()]',S"++c2B-B'C]
 
"] ]r   r  zcausal language modelingc                       \ rS rSr\rSrg)AutoModelForMaskedLMif  r   N)r   r   r   r   MODEL_FOR_MASKED_LM_MAPPINGr  r   r   r   r   r  r  f  s    0Nr   r  zmasked language modelingc                       \ rS rSr\rSrg)AutoModelForSeq2SeqLMim  r   N)r   r   r   r   &MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPINGr  r   r   r   r   r  r  m      ;Nr   r  z&sequence-to-sequence language modelingzgoogle-t5/t5-base)r  checkpoint_for_examplec                       \ rS rSr\rSrg)"AutoModelForSequenceClassificationix  r   N)r   r   r   r   )MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPINGr  r   r   r   r   r  r  x  s    >Nr   r  zsequence classificationc                       \ rS rSr\rSrg)AutoModelForQuestionAnsweringi  r   N)r   r   r   r   $MODEL_FOR_QUESTION_ANSWERING_MAPPINGr  r   r   r   r   r  r    r  r   r  zquestion answeringc                       \ rS rSr\rSrg)"AutoModelForTableQuestionAnsweringi  r   N)r   r   r   r   *MODEL_FOR_TABLE_QUESTION_ANSWERING_MAPPINGr  r   r   r   r   r   r         ?Nr   r   ztable question answeringzgoogle/tapas-base-finetuned-wtqc                       \ rS rSr\rSrg)#AutoModelForVisualQuestionAnsweringi  r   N)r   r   r   r   +MODEL_FOR_VISUAL_QUESTION_ANSWERING_MAPPINGr  r   r   r   r   r  r    s    @Nr   r  zvisual question answeringzdandelin/vilt-b32-finetuned-vqac                       \ rS rSr\rSrg)%AutoModelForDocumentQuestionAnsweringi  r   N)r   r   r   r   -MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPINGr  r   r   r   r   r  r    s    BNr   r  zdocument question answeringz/impira/layoutlm-document-qa", revision="52e01b3c                       \ rS rSr\rSrg)AutoModelForTokenClassificationi  r   N)r   r   r   r   &MODEL_FOR_TOKEN_CLASSIFICATION_MAPPINGr  r   r   r   r   r
  r
    r  r   r
  ztoken classificationc                       \ rS rSr\rSrg)AutoModelForMultipleChoicei  r   N)r   r   r   r   !MODEL_FOR_MULTIPLE_CHOICE_MAPPINGr  r   r   r   r   r  r    r  r   r  zmultiple choicec                       \ rS rSr\rSrg)"AutoModelForNextSentencePredictioni  r   N)r   r   r   r   *MODEL_FOR_NEXT_SENTENCE_PREDICTION_MAPPINGr  r   r   r   r   r  r    r  r   r  znext sentence predictionc                       \ rS rSr\rSrg)AutoModelForImageClassificationi  r   N)r   r   r   r   &MODEL_FOR_IMAGE_CLASSIFICATION_MAPPINGr  r   r   r   r   r  r    r  r   r  zimage classificationc                       \ rS rSr\rSrg)'AutoModelForZeroShotImageClassificationi  r   N)r   r   r   r   0MODEL_FOR_ZERO_SHOT_IMAGE_CLASSIFICATION_MAPPINGr  r   r   r   r   r  r    s    ENr   r  zzero-shot image classificationc                       \ rS rSr\rSrg)AutoModelForImageSegmentationi  r   N)r   r   r   r   $MODEL_FOR_IMAGE_SEGMENTATION_MAPPINGr  r   r   r   r   r  r    r  r   r  zimage segmentationc                       \ rS rSr\rSrg) AutoModelForSemanticSegmentationi  r   N)r   r   r   r   'MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPINGr  r   r   r   r   r  r        <Nr   r  zsemantic segmentationc                       \ rS rSr\rSrg) AutoModelForTimeSeriesPredictioni  r   N)r   r   r   r   (MODEL_FOR_TIME_SERIES_PREDICTION_MAPPINGr  r   r   r   r   r   r         =Nr   r   ztime-series predictionc                       \ rS rSr\rSrg)!AutoModelForUniversalSegmentationi  r   N)r   r   r   r   (MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPINGr  r   r   r   r   r$  r$    r"  r   r$  zuniversal image segmentationc                       \ rS rSr\rSrg) AutoModelForInstanceSegmentationi  r   N)r   r   r   r   'MODEL_FOR_INSTANCE_SEGMENTATION_MAPPINGr  r   r   r   r   r'  r'    r  r   r'  zinstance segmentationc                       \ rS rSr\rSrg)AutoModelForObjectDetectioni  r   N)r   r   r   r   "MODEL_FOR_OBJECT_DETECTION_MAPPINGr  r   r   r   r   r*  r*        7Nr   r*  zobject detectionc                       \ rS rSr\rSrg)#AutoModelForZeroShotObjectDetectioni  r   N)r   r   r   r   ,MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPINGr  r   r   r   r   r.  r.        ANr   r.  zzero-shot object detectionc                       \ rS rSr\rSrg)AutoModelForDepthEstimationi  r   N)r   r   r   r   "MODEL_FOR_DEPTH_ESTIMATION_MAPPINGr  r   r   r   r   r2  r2    r,  r   r2  zdepth estimationc                       \ rS rSr\rSrg)AutoModelForVideoClassificationi  r   N)r   r   r   r   &MODEL_FOR_VIDEO_CLASSIFICATION_MAPPINGr  r   r   r   r   r5  r5    r  r   r5  zvideo classificationc                       \ rS rSr\rSrg)_AutoModelForVision2Seqi  r   N)r   r   r   r   MODEL_FOR_VISION_2_SEQ_MAPPINGr  r   r   r   r   r8  r8    s    3Nr   r8  zvision-to-text modelingc                   p   ^  \ rS rSr\r\S\S    S\\	\
R                  \	   4   SS4U 4S jj5       rSrU =r$ )AutoModelForImageTextToTexti!  r  r  r  r   c                 ,   > [         TU ]  " U/UQ70 UD6$ r  r  r  s       r   r  +AutoModelForImageTextToText.from_pretrained%  r  r   r   )r   r   r   r   $MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPINGr  r  r  r   r  r  r  r  r   r  r  s   @r   r;  r;  !  sT    9N ]/0]',S"++c2B-B'C]
 
"] ]r   r;  zimage-text-to-text modelingc                       \ rS rSr\rSrg)AutoModelForAudioClassificationi2  r   N)r   r   r   r   &MODEL_FOR_AUDIO_CLASSIFICATION_MAPPINGr  r   r   r   r   r@  r@  2  r  r   r@  zaudio classificationc                       \ rS rSr\rSrg)AutoModelForCTCi9  r   N)r   r   r   r   MODEL_FOR_CTC_MAPPINGr  r   r   r   r   rC  rC  9  s    *Nr   rC  z%connectionist temporal classificationc                       \ rS rSr\rSrg)AutoModelForSpeechSeq2Seqi@  r   N)r   r   r   r   "MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPINGr  r   r   r   r   rF  rF  @  r,  r   rF  z,sequence-to-sequence speech-to-text modelingc                       \ rS rSr\rSrg)$AutoModelForAudioFrameClassificationiI  r   N)r   r   r   r   ,MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPINGr  r   r   r   r   rI  rI  I  r0  r   rI  z"audio frame (token) classificationc                       \ rS rSr\rSrg)AutoModelForAudioXVectoriR  r   N)r   r   r   r   MODEL_FOR_AUDIO_XVECTOR_MAPPINGr  r   r   r   r   rL  rL  R  r  r   rL  c                       \ rS rSr\rSrg)AutoModelForTextToSpectrogramiV  r   N)r   r   r   r   %MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPINGr  r   r   r   r   rO  rO  V  s    :Nr   rO  c                       \ rS rSr\rSrg)AutoModelForTextToWaveformiZ  r   N)r   r   r   r   "MODEL_FOR_TEXT_TO_WAVEFORM_MAPPINGr  r   r   r   r   rR  rR  Z  r,  r   rR  c                       \ rS rSr\rSrg)AutoBackbonei^  r   N)r   r   r   r   MODEL_FOR_BACKBONE_MAPPINGr  r   r   r   r   rU  rU  ^  r  r   rU  zaudio retrieval via x-vectorc                       \ rS rSr\rSrg)AutoModelForMaskedImageModelingie  r   N)r   r   r   r   'MODEL_FOR_MASKED_IMAGE_MODELING_MAPPINGr  r   r   r   r   rX  rX  e  r  r   rX  zmasked image modelingc                       \ rS rSr\rSrg)AutoModelForAudioTokenizationil  r   N)r   r   r   r   $MODEL_FOR_AUDIO_TOKENIZATION_MAPPINGr  r   r   r   r   r[  r[  l  r  r   r[  z$audio tokenization through codebooksc                   H   ^  \ rS rSr\U 4S j5       r\U 4S j5       rSrU =r$ )AutoModelWithLMHeadiu  c                 X   > [         R                  " S[        5        [        TU ]  U5      $ NzThe class `AutoModelWithLMHead` is deprecated and will be removed in a future version. Please use `AutoModelForCausalLM` for causal language models, `AutoModelForMaskedLM` for masked language models and `AutoModelForSeq2SeqLM` for encoder-decoder models.warningswarnFutureWarningr  from_configr  configr  s     r   re  AutoModelWithLMHead.from_configv  s,    B 		
 w"6**r   c                 b   > [         R                  " S[        5        [        TU ]  " U/UQ70 UD6$ r`  rb  rc  rd  r  r  r  s       r   r  #AutoModelWithLMHead.from_pretrained  s8    B 		
 w&'D\z\U[\\r   r   	r   r   r   r   r  re  r  r   r  r  s   @r   r^  r^  u  s+    + + ] ]r   r^  c                   H   ^  \ rS rSr\U 4S j5       r\U 4S j5       rSrU =r$ )AutoModelForVision2Seqi  c                 X   > [         R                  " S[        5        [        TU ]  U5      $ NzThe class `AutoModelForVision2Seq` is deprecated and will be removed in v5.0. Please use `AutoModelForImageTextToText` instead.ra  rf  s     r   re  "AutoModelForVision2Seq.from_config  s)    5	

 w"6**r   c                 b   > [         R                  " S[        5        [        TU ]  " U/UQ70 UD6$ rp  rj  r  s       r   r  &AutoModelForVision2Seq.from_pretrained  s5    5	

 w&'D\z\U[\\r   r   rl  r  s   @r   rn  rn    s+    + + ] ]r   rn  )YrA  rJ  r\  rM  rV  'MODEL_FOR_CAUSAL_IMAGE_MODELING_MAPPINGr  rD  r  r3  r  MODEL_FOR_IMAGE_MAPPINGr  r  r  r  r(  rY  r  r  r  r  r+  r  r  r  r  r  rG  r  r  rS  rP  r!  r  r%  r6  r9  MODEL_FOR_RETRIEVAL_MAPPINGr>  r  r  r  r  r/  ,MODEL_FOR_TIME_SERIES_CLASSIFICATION_MAPPING(MODEL_FOR_TIME_SERIES_REGRESSION_MAPPINGr  rU  r@  rI  r[  rL  r  rC  r2  r  r  r  r'  r  r  r  r  rX  r  r  r  r*  r  r  r  r  r  rF  r   rO  rR  r   r
  r$  r5  rn  r  r  r^  r  r.  r;  )__doc__r  rb  collectionsr   typingr   r   utilsr   auto_factoryr	   r
   r   r   configuration_autor   
generationr   modeling_utilsr   r   
get_loggerr   loggerMODEL_MAPPING_NAMES#MODEL_FOR_PRETRAINING_MAPPING_NAMES MODEL_WITH_LM_HEAD_MAPPING_NAMES!MODEL_FOR_CAUSAL_LM_MAPPING_NAMESMODEL_FOR_IMAGE_MAPPING_NAMES-MODEL_FOR_MASKED_IMAGE_MODELING_MAPPING_NAMES-MODEL_FOR_CAUSAL_IMAGE_MODELING_MAPPING_NAMES,MODEL_FOR_IMAGE_CLASSIFICATION_MAPPING_NAMES*MODEL_FOR_IMAGE_SEGMENTATION_MAPPING_NAMES-MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPING_NAMES-MODEL_FOR_INSTANCE_SEGMENTATION_MAPPING_NAMES.MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPING_NAMES,MODEL_FOR_VIDEO_CLASSIFICATION_MAPPING_NAMES$MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES!MODEL_FOR_RETRIEVAL_MAPPING_NAMES*MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMES!MODEL_FOR_MASKED_LM_MAPPING_NAMES(MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMES2MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPING_NAMES(MODEL_FOR_DEPTH_ESTIMATION_MAPPING_NAMES,MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES(MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMES/MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPING_NAMES*MODEL_FOR_QUESTION_ANSWERING_MAPPING_NAMES0MODEL_FOR_TABLE_QUESTION_ANSWERING_MAPPING_NAMES1MODEL_FOR_VISUAL_QUESTION_ANSWERING_MAPPING_NAMES3MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPING_NAMES,MODEL_FOR_TOKEN_CLASSIFICATION_MAPPING_NAMES'MODEL_FOR_MULTIPLE_CHOICE_MAPPING_NAMES0MODEL_FOR_NEXT_SENTENCE_PREDICTION_MAPPING_NAMES,MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMESMODEL_FOR_CTC_MAPPING_NAMES2MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPING_NAMES%MODEL_FOR_AUDIO_XVECTOR_MAPPING_NAMES+MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPING_NAMES(MODEL_FOR_TEXT_TO_WAVEFORM_MAPPING_NAMES6MODEL_FOR_ZERO_SHOT_IMAGE_CLASSIFICATION_MAPPING_NAMES MODEL_FOR_BACKBONE_MAPPING_NAMES'MODEL_FOR_MASK_GENERATION_MAPPING_NAMES*MODEL_FOR_KEYPOINT_DETECTION_MAPPING_NAMES)MODEL_FOR_KEYPOINT_MATCHING_MAPPING_NAMES%MODEL_FOR_TEXT_ENCODING_MAPPING_NAMES2MODEL_FOR_TIME_SERIES_CLASSIFICATION_MAPPING_NAMES.MODEL_FOR_TIME_SERIES_REGRESSION_MAPPING_NAMES.MODEL_FOR_TIME_SERIES_PREDICTION_MAPPING_NAMES&MODEL_FOR_IMAGE_TO_IMAGE_MAPPING_NAMES"MODEL_FOR_AUDIO_TOKENIZATION_NAMESr  r  r  r  rt  r  r  r  r  r(  r%  r6  r9  r>  rv  r  r  r  ru  rY  r+  r/  r3  r  r  r  r  r  r  r  rA  rD  rG  rJ  rM  rP  rS  rV  r  r  r  r  rw  rx  r!  r  r\  r  r  r  r  r  r  r  r  r  r  r  r  r  r   r  r  r
  r  r  r  r  r  r  r   r$  r'  r*  r.  r2  r5  r8  r;  r@  rC  rF  rI  rL  rO  rR  rU  rX  r[  r^  rn  __all__r   r   r   <module>r     s    	  # '   5 -1/  
		H	%!gi V '2Y[' #z $/VX$  t %0BD% !L !,;=! ~ 1<1 - 1< 	71 - 0;AC0 ,J .9 	(. * 1<
1 - 1< 	<1 - 2=	2 . 0;0 , (3( $6 %0*% ! .9*,. *\ %002% !h ,7, (  6A	6 2 ,7
, ( 0;!0 ,F ,7, (  3>mo3 /b .9NP. *d 4? 	/4 0 5@5 1 7B7 3 0;UW0 ,r +6)++ 'Z 4?
4 0 0;0 ,$ * " 6A
6 2 )4
) % /: 	?// + ,7, (  :E: 6 $/$  6 +6 + ' .98. * -8- ) )4 ") %H 6AC16 2 2=5-2 . 2=02 . *55* & &1& " !!57JK 01EGj k -.BDde ./CEfg *:G+ ' *:F* & 4DP4 0 (8D( $ +;G+ ' +;G+ ' ,<H, ( *:F* & "22FHl!m '7D( $ //CEfg .>K/ + 1AM1 - //CEfg *+?A^_ *:G+ ' &66JLt%u "/?L0 , &66JLt%u ")9F* & -=I- ) (8D( $ .>J. * *:F* & %55IKr$s !-=J. * *:F* & ))=?Z[ %56JLt%u "/?L0 , #33GIn"o (8E) % &66JLt%u "-.BDde $45IKr$s !'7D( $ '77KMv&w #"23GIn"o /?L0 , ,<H, ( ,<H, ( $44HJp#q  '78LNp'q $7!4 7:$7 :9#6 952 562 6## # i(	31 3 ,,Cm\ 0. 0 ))=H[\ ]. ] ))=Hbc 1. 1 ))=Hbc </ < *5. ?)< ? &7&1J& "
:$7 : !22OZn o @)< @ &7&'<& "A*= A '8'(<' #C,? C ):)*L) %<&9 < #44S^t"u 7!4 7 //ITef @)< @ &7&1K& "
<&9 < #44S^t"u F.A F +<+6V+ '
:$7 : !22OZn o =': = $5$/F$  
>': > $5$/G$  
>(; > %6%0N% !
=': = $5$/F$  
8"5 8 00KVhi B*= B '8'2N' #
8"5 8 00KVhi <&9 < #44S^t"u 41 4 ,,CNgh ]"5 ] 00KVst <&9 < #44S^t"u +) + $O>ef8 3 8 .(V 
B+> B (9(3W( $
52 5;$7 ;8!4 80) 0 --EPno =&9 = #44S^u"v :$7 : !2!,R! 
]. ],]4 ](Zr   