ó
    <±hº  ã                   óv  • S r SSKJrJrJr  SSKrSSKrSSKJr  SSKJ	r	J
r
Jr  SSKJr  SSKJr  SS	KJrJrJrJrJrJr  SS
KJrJr  SSKJrJrJr  SSKJrJ r J!r!  SSK"J#r#  \!RH                  " \%5      r&\RN                  r( " S S\RR                  5      r*  S@S\RR                  S\RV                  S\RV                  S\RV                  S\\RV                     S\,S\,S\\RV                     4S jjr- " S S\RR                  5      r. " S S\RR                  5      r/ " S S\RR                  5      r0 " S  S!\RR                  5      r1 " S" S#\RR                  5      r2 " S$ S%\5      r3 " S& S'\RR                  5      r4 " S( S)\RR                  5      r5 " S* S+\RR                  5      r6 " S, S-\RR                  5      r7 " S. S/\RR                  5      r8\ " S0 S1\5      5       r9\ " S2 S3\95      5       r:\ " S4 S5\95      5       r;\" S6S79 " S8 S9\95      5       r<\" S:S79 " S; S<\95      5       r=\ " S= S>\95      5       r>/ S?Qr?g)AzPyTorch LayoutLM model.é    )ÚCallableÚOptionalÚUnionN)Únn)ÚBCEWithLogitsLossÚCrossEntropyLossÚMSELossé   )ÚACT2FN)ÚGradientCheckpointingLayer)ÚBaseModelOutputÚBaseModelOutputWithPoolingÚMaskedLMOutputÚQuestionAnsweringModelOutputÚSequenceClassifierOutputÚTokenClassifierOutput)ÚALL_ATTENTION_FUNCTIONSÚPreTrainedModel)Úapply_chunking_to_forwardÚ find_pruneable_heads_and_indicesÚprune_linear_layer)Úauto_docstringÚcan_return_tupleÚloggingé   )ÚLayoutLMConfigc                   ó@   ^ • \ rS rSrSrU 4S jr     SS jrSrU =r$ )ÚLayoutLMEmbeddingsé.   zGConstruct the embeddings from word, position and token_type embeddings.c                 óà  >• [         TU ]  5         [        R                  " UR                  UR
                  UR                  S9U l        [        R                  " UR                  UR
                  5      U l	        [        R                  " UR                  UR
                  5      U l        [        R                  " UR                  UR
                  5      U l        [        R                  " UR                  UR
                  5      U l        [        R                  " UR                  UR
                  5      U l        [        R                  " UR                  UR
                  5      U l        [#        UR
                  UR$                  S9U l        [        R(                  " UR*                  5      U l        U R/                  S[0        R2                  " UR                  5      R5                  S5      SS9  g )N)Úpadding_idx©ÚepsÚposition_ids)r   éÿÿÿÿF)Ú
persistent)ÚsuperÚ__init__r   Ú	EmbeddingÚ
vocab_sizeÚhidden_sizeÚpad_token_idÚword_embeddingsÚmax_position_embeddingsÚposition_embeddingsÚmax_2d_position_embeddingsÚx_position_embeddingsÚy_position_embeddingsÚh_position_embeddingsÚw_position_embeddingsÚtype_vocab_sizeÚtoken_type_embeddingsÚLayoutLMLayerNormÚlayer_norm_epsÚ	LayerNormÚDropoutÚhidden_dropout_probÚdropoutÚregister_bufferÚtorchÚarangeÚexpand©ÚselfÚconfigÚ	__class__s     €Úf/var/www/html/shao/venv/lib/python3.13/site-packages/transformers/models/layoutlm/modeling_layoutlm.pyr(   ÚLayoutLMEmbeddings.__init__1   s[  ø€ Ü‰ÑÔÜ!Ÿ|š|¨F×,=Ñ,=¸v×?QÑ?QÐ_e×_rÑ_rÑsˆÔÜ#%§<¢<°×0NÑ0NÐPV×PbÑPbÓ#cˆÔ Ü%'§\¢\°&×2SÑ2SÐU[×UgÑUgÓ%hˆÔ"Ü%'§\¢\°&×2SÑ2SÐU[×UgÑUgÓ%hˆÔ"Ü%'§\¢\°&×2SÑ2SÐU[×UgÑUgÓ%hˆÔ"Ü%'§\¢\°&×2SÑ2SÐU[×UgÑUgÓ%hˆÔ"Ü%'§\¢\°&×2HÑ2HÈ&×J\ÑJ\Ó%]ˆÔ"ä*¨6×+=Ñ+=À6×CXÑCXÑYˆŒÜ—z’z &×"<Ñ"<Ó=ˆŒà×ÑØœEŸLšL¨×)GÑ)GÓH×OÑOÐPWÓXÐejð 	ò 	
ó    c                 ó°  • Ub  UR                  5       nOUR                  5       S S nUS   nUb  UR                  OUR                  nUc  U R                  S S 2S U24   nUc$  [        R                  " U[        R
                  US9nUc  U R                  U5      nUn	U R                  U5      n
 U R                  US S 2S S 2S4   5      nU R                  US S 2S S 2S4   5      nU R                  US S 2S S 2S4   5      nU R                  US S 2S S 2S4   5      nU R                  US S 2S S 2S4   US S 2S S 2S4   -
  5      nU R                  US S 2S S 2S4   US S 2S S 2S4   -
  5      nU R                  U5      nU	U
-   U-   U-   U-   U-   U-   U-   U-   nU R                  U5      nU R                  U5      nU$ ! [         a  n[        S5      UeS nAff = f)Nr%   r   ©ÚdtypeÚdevicer   é   r
   z:The `bbox`coordinate values should be within 0-1000 range.)ÚsizerK   r$   r>   ÚzerosÚlongr-   r/   r1   r2   Ú
IndexErrorr3   r4   r6   r9   r<   )rB   Ú	input_idsÚbboxÚtoken_type_idsr$   Úinputs_embedsÚinput_shapeÚ
seq_lengthrK   Úwords_embeddingsr/   Úleft_position_embeddingsÚupper_position_embeddingsÚright_position_embeddingsÚlower_position_embeddingsÚer3   r4   r6   Ú
embeddingss                       rE   ÚforwardÚLayoutLMEmbeddings.forwardB   s1  € ð Ñ Ø#Ÿ.™.Ó*‰Kà'×,Ñ,Ó.¨s°Ð3ˆKà  ‘^ˆ
à%.Ñ%:×!Ò!À×@TÑ@TˆàÑØ×,Ñ,ªQ°°°¨^Ñ<ˆLàÑ!Ü"Ÿ[š[¨¼E¿J¹JÈvÑVˆNàÑ Ø ×0Ñ0°Ó;ˆMà(ÐØ"×6Ñ6°|ÓDÐð	bØ'+×'AÑ'AÀ$ÂqÊ!ÈQÀwÁ-Ó'PÐ$Ø(,×(BÑ(BÀ4ÊÊ1ÈaÈÁ=Ó(QÐ%Ø(,×(BÑ(BÀ4ÊÊ1ÈaÈÁ=Ó(QÐ%Ø(,×(BÑ(BÀ4ÊÊ1ÈaÈÁ=Ó(QÐ%ð !%× :Ñ :¸4ÂÂ1ÀaÀ¹=È4ÒPQÒSTÐVWÐPWÉ=Ñ;XÓ YÐØ $× :Ñ :¸4ÂÂ1ÀaÀ¹=È4ÒPQÒSTÐVWÐPWÉ=Ñ;XÓ YÐØ $× :Ñ :¸>Ó JÐð Ø!ñ"à&ñ'ð (ñ(ð (ñ	(ð
 (ñ(ð $ñ$ð $ñ$ð $ñ$ð 	ð —^‘^ JÓ/ˆ
Ø—\‘\ *Ó-ˆ
ØÐøô) ó 	bÜÐYÓZÐ`aÐaûð	bús   Â/A,F: Æ:
GÇGÇG)	r9   r<   r3   r/   r6   r4   r-   r1   r2   )NNNNN)	Ú__name__Ú
__module__Ú__qualname__Ú__firstlineno__Ú__doc__r(   r^   Ú__static_attributes__Ú__classcell__©rD   s   @rE   r   r   .   s&   ø† ÙQõ
ð& ØØØØ÷5ò 5rG   r   ÚmoduleÚqueryÚkeyÚvalueÚattention_maskÚscalingr<   Ú	head_maskc                 ó  • [         R                  " XR                  SS5      5      U-  n	Ub"  US S 2S S 2S S 2S UR                  S   24   n
Xš-   n	[        R
                  R                  U	S[         R                  S9R                  UR                  5      n	[        R
                  R                  X–U R                  S9n	Ub  X—R                  SSSS5      -  n	[         R                  " X“5      nUR                  SS5      R                  5       nX¹4$ )NrL   r
   éþÿÿÿr%   )ÚdimrJ   )ÚpÚtrainingr   )r>   ÚmatmulÚ	transposeÚshaper   Ú
functionalÚsoftmaxÚfloat32ÚtorJ   r<   rs   ÚviewÚ
contiguous)rh   ri   rj   rk   rl   rm   r<   rn   ÚkwargsÚattn_weightsÚcausal_maskÚattn_outputs               rE   Úeager_attention_forwardr   {   sì   € ô —<’< §}¡}°Q¸Ó':Ó;¸gÑE€LØÑ!Ø$¢Qªª1¨o°·	±	¸"±¨oÐ%=Ñ>ˆØ#Ñ1ˆä—=‘=×(Ñ(¨¸2ÄUÇ]Á]Ð(ÐS×VÑVÐW\×WbÑWbÓc€LÜ—=‘=×(Ñ(¨È6Ï?É?Ð(Ð[€LàÑØ#§n¡n°Q¸¸A¸qÓ&AÑAˆä—,’,˜|Ó3€KØ×'Ñ'¨¨1Ó-×8Ñ8Ó:€KØÐ$Ð$rG   c                   ó¸   ^ • \ rS rSrU 4S jr   S
S\R                  S\\R                     S\\R                     S\\	   S\
\R                     4
S jjrS	rU =r$ )ÚLayoutLMSelfAttentioné—   c                 ó6  >• [         TU ]  5         UR                  UR                  -  S:w  a7  [	        US5      (       d&  [        SUR                   SUR                   S35      eXl        UR                  U l        [        UR                  UR                  -  5      U l        U R                  U R                  -  U l	        [        R                  " UR                  U R                  5      U l        [        R                  " UR                  U R                  5      U l        [        R                  " UR                  U R                  5      U l        [        R                  " UR                   5      U l        UR                   U l        U R                  S-  U l        g )Nr   Úembedding_sizezThe hidden size (z6) is not a multiple of the number of attention heads (Ú)g      à¿)r'   r(   r+   Únum_attention_headsÚhasattrÚ
ValueErrorrC   ÚintÚattention_head_sizeÚall_head_sizer   ÚLinearri   rj   rk   r:   Úattention_probs_dropout_probr<   Úattention_dropoutrm   rA   s     €rE   r(   ÚLayoutLMSelfAttention.__init__˜   sD  ø€ Ü‰ÑÔØ×Ñ × :Ñ :Ñ:¸aÓ?ÌÐPVÐXh×HiÑHiÜØ# F×$6Ñ$6Ð#7ð 8Ø ×4Ñ4Ð5°Qð8óð ð
 ŒØ#)×#=Ñ#=ˆÔ Ü#& v×'9Ñ'9¸F×<VÑ<VÑ'VÓ#WˆÔ Ø!×5Ñ5¸×8PÑ8PÑPˆÔä—Y’Y˜v×1Ñ1°4×3EÑ3EÓFˆŒ
Ü—9’9˜V×/Ñ/°×1CÑ1CÓDˆŒÜ—Y’Y˜v×1Ñ1°4×3EÑ3EÓFˆŒ
ä—z’z &×"EÑ"EÓFˆŒØ!'×!DÑ!DˆÔØ×/Ñ/°Ñ5ˆrG   Úhidden_statesrl   rn   Úoutput_attentionsÚreturnc                 óº  • UR                   S S n/ UQSPU R                  P7nU R                  U5      R                  U5      R	                  SS5      nU R                  U5      R                  U5      R	                  SS5      n	U R                  U5      R                  U5      R	                  SS5      n
[        nU R                  R                  S:w  a  [        U R                  R                     nU" U UU	U
U4U R                  (       d  SOU R                  U R                  US.UD6u  pÍUR                  " / UQSP76 R                  5       nU(       a  XÍ4nU$ U4nU$ )Nr%   r   rL   Úeagerç        )r<   rm   rn   )rv   rŒ   ri   r{   ru   rj   rk   r   rC   Ú_attn_implementationr   rs   r   rm   Úreshaper|   )rB   r’   rl   rn   r“   r}   rU   Úhidden_shapeÚquery_statesÚ
key_statesÚvalue_statesÚattention_interfacer€   r~   Úoutputss                  rE   r^   ÚLayoutLMSelfAttention.forward­   s[  € ð $×)Ñ)¨#¨2Ð.ˆØC˜ÐC bÐC¨$×*BÑ*BÑCˆà—z‘z -Ó0×5Ñ5°lÓC×MÑMÈaÐQRÓSˆØ—X‘X˜mÓ,×1Ñ1°,Ó?×IÑIÈ!ÈQÓOˆ
Ø—z‘z -Ó0×5Ñ5°lÓC×MÑMÈaÐQRÓSˆä(?ÐØ;‰;×+Ñ+¨wÓ6Ü"9¸$¿+¹+×:ZÑ:ZÑ"[Ðá$7ØØØØØð
%
ð  $Ÿ}Ÿ}‘C°$×2HÑ2HØ—L‘LØñ
%
ð ñ
%
Ñ!ˆð "×)Ò)Ð;¨;Ð;¸Ò;×FÑFÓHˆÞ1B;Ð-ˆØˆð JUÈˆØˆrG   )
r   r   rŒ   rC   r<   rj   rˆ   ri   rm   rk   ©NNF)r`   ra   rb   rc   r(   r>   ÚTensorr   ÚFloatTensorÚboolÚtupler^   re   rf   rg   s   @rE   rƒ   rƒ   —   st   ø† õ6ð0 7;Ø15Ø,1ñ!à—|‘|ð!ð ! ×!2Ñ!2Ñ3ð!ð ˜E×-Ñ-Ñ.ð	!ð
 $ D™>ð!ð 
ˆu|‰|Ñ	÷!ó !rG   rƒ   c                   óz   ^ • \ rS rSrU 4S jrS\R                  S\R                  S\R                  4S jrSrU =r	$ )ÚLayoutLMSelfOutputéÒ   c                 ó(  >• [         TU ]  5         [        R                  " UR                  UR                  5      U l        [        R                  " UR                  UR                  S9U l        [        R                  " UR                  5      U l
        g ©Nr"   )r'   r(   r   rŽ   r+   Údenser9   r8   r:   r;   r<   rA   s     €rE   r(   ÚLayoutLMSelfOutput.__init__Ó   s`   ø€ Ü‰ÑÔÜ—Y’Y˜v×1Ñ1°6×3EÑ3EÓFˆŒ
ÜŸš f×&8Ñ&8¸f×>SÑ>SÑTˆŒÜ—z’z &×"<Ñ"<Ó=ˆrG   r’   Úinput_tensorr”   c                 óp   • U R                  U5      nU R                  U5      nU R                  X-   5      nU$ ©N©r«   r<   r9   ©rB   r’   r­   s      rE   r^   ÚLayoutLMSelfOutput.forwardÙ   ó5   € ØŸ
™
 =Ó1ˆØŸ™ ]Ó3ˆØŸ™ }Ñ'CÓDˆØÐrG   ©r9   r«   r<   ©
r`   ra   rb   rc   r(   r>   r¢   r^   re   rf   rg   s   @rE   r§   r§   Ò   ó6   ø† õ>ð U§\¡\ð ÀÇÁð ÐRW×R^ÑR^÷ ò rG   r§   c                   ó¾   ^ • \ rS rSrU 4S jrS r   SS\R                  S\\R                     S\\R                     S\\
   S\\R                     4
S	 jjrS
rU =r$ )ÚLayoutLMAttentionéá   c                 ó€   >• [         TU ]  5         [        U5      U l        [	        U5      U l        [        5       U l        g r¯   )r'   r(   rƒ   rB   r§   ÚoutputÚsetÚpruned_headsrA   s     €rE   r(   ÚLayoutLMAttention.__init__â   s0   ø€ Ü‰ÑÔÜ)¨&Ó1ˆŒ	Ü(¨Ó0ˆŒÜ›EˆÕrG   c                 ó6  • [        U5      S:X  a  g [        XR                  R                  U R                  R                  U R
                  5      u  p[        U R                  R                  U5      U R                  l        [        U R                  R                  U5      U R                  l        [        U R                  R                  U5      U R                  l	        [        U R                  R                  USS9U R                  l        U R                  R                  [        U5      -
  U R                  l        U R                  R                  U R                  R                  -  U R                  l        U R
                  R                  U5      U l        g )Nr   r   ©rq   )Úlenr   rB   rˆ   rŒ   r½   r   ri   rj   rk   r»   r«   r   Úunion)rB   ÚheadsÚindexs      rE   Úprune_headsÚLayoutLMAttention.prune_headsè   s  € Üˆu‹:˜‹?ØÜ7Ø—9‘9×0Ñ0°$·)±)×2OÑ2OÐQU×QbÑQbó
‰ˆô
 -¨T¯Y©Y¯_©_¸eÓDˆ	‰	ŒÜ*¨4¯9©9¯=©=¸%Ó@ˆ	‰	ŒÜ,¨T¯Y©Y¯_©_¸eÓDˆ	‰	ŒÜ.¨t¯{©{×/@Ñ/@À%ÈQÑOˆ‰Ôð )-¯	©	×(EÑ(EÌÈEË
Ñ(Rˆ	‰	Ô%Ø"&§)¡)×"?Ñ"?À$Ç)Á)×B_ÑB_Ñ"_ˆ	‰	ÔØ ×-Ñ-×3Ñ3°EÓ:ˆÕrG   r’   rl   rn   r“   r”   c                 óp   • U R                   " U4UUUS.UD6nU R                  US   U5      nU4USS  -   nU$ ©N)rl   rn   r“   r   r   )rB   r»   )	rB   r’   rl   rn   r“   r}   Úself_outputsÚattention_outputrŸ   s	            rE   r^   ÚLayoutLMAttention.forwardú   s]   € ð —y’yØð
à)ØØ/ñ	
ð
 ñ
ˆð  Ÿ;™; |°A¡¸ÓFÐØ#Ð%¨°Q°RÐ(8Ñ8ˆØˆrG   )r»   r½   rB   r¡   )r`   ra   rb   rc   r(   rÅ   r>   r¢   r   r£   r¤   r¥   r^   re   rf   rg   s   @rE   r¸   r¸   á   sy   ø† õ"ò;ð* 7;Ø15Ø,1ñà—|‘|ðð ! ×!2Ñ!2Ñ3ðð ˜E×-Ñ-Ñ.ð	ð
 $ D™>ðð 
ˆu|‰|Ñ	÷ó rG   r¸   c                   ób   ^ • \ rS rSrU 4S jrS\R                  S\R                  4S jrSrU =r	$ )ÚLayoutLMIntermediatei  c                 ó  >• [         TU ]  5         [        R                  " UR                  UR
                  5      U l        [        UR                  [        5      (       a  [        UR                     U l        g UR                  U l        g r¯   )r'   r(   r   rŽ   r+   Úintermediate_sizer«   Ú
isinstanceÚ
hidden_actÚstrr   Úintermediate_act_fnrA   s     €rE   r(   ÚLayoutLMIntermediate.__init__  s`   ø€ Ü‰ÑÔÜ—Y’Y˜v×1Ñ1°6×3KÑ3KÓLˆŒ
Üf×'Ñ'¬×-Ñ-Ü'-¨f×.?Ñ.?Ñ'@ˆDÕ$à'-×'8Ñ'8ˆDÕ$rG   r’   r”   c                 óJ   • U R                  U5      nU R                  U5      nU$ r¯   ©r«   rÓ   ©rB   r’   s     rE   r^   ÚLayoutLMIntermediate.forward  s&   € ØŸ
™
 =Ó1ˆØ×0Ñ0°Ó?ˆØÐrG   rÖ   rµ   rg   s   @rE   rÍ   rÍ     s(   ø† õ9ð U§\¡\ð °e·l±l÷ ò rG   rÍ   c                   óz   ^ • \ rS rSrU 4S jrS\R                  S\R                  S\R                  4S jrSrU =r	$ )ÚLayoutLMOutputi  c                 ó(  >• [         TU ]  5         [        R                  " UR                  UR
                  5      U l        [        R                  " UR
                  UR                  S9U l        [        R                  " UR                  5      U l        g rª   )r'   r(   r   rŽ   rÏ   r+   r«   r9   r8   r:   r;   r<   rA   s     €rE   r(   ÚLayoutLMOutput.__init__   s`   ø€ Ü‰ÑÔÜ—Y’Y˜v×7Ñ7¸×9KÑ9KÓLˆŒ
ÜŸš f×&8Ñ&8¸f×>SÑ>SÑTˆŒÜ—z’z &×"<Ñ"<Ó=ˆrG   r’   r­   r”   c                 óp   • U R                  U5      nU R                  U5      nU R                  X-   5      nU$ r¯   r°   r±   s      rE   r^   ÚLayoutLMOutput.forward&  r³   rG   r´   rµ   rg   s   @rE   rÚ   rÚ     r¶   rG   rÚ   c                   ó¾   ^ • \ rS rSrU 4S jr   SS\R                  S\\R                     S\\R                     S\\	   S\
\R                     4
S jjrS	 rS
rU =r$ )ÚLayoutLMLayeri.  c                 ó²   >• [         TU ]  5         UR                  U l        SU l        [	        U5      U l        [        U5      U l        [        U5      U l	        g )Nr   )
r'   r(   Úchunk_size_feed_forwardÚseq_len_dimr¸   Ú	attentionrÍ   ÚintermediaterÚ   r»   rA   s     €rE   r(   ÚLayoutLMLayer.__init__/  sI   ø€ Ü‰ÑÔØ'-×'EÑ'EˆÔ$ØˆÔÜ*¨6Ó2ˆŒÜ0°Ó8ˆÔÜ$ VÓ,ˆrG   r’   rl   rn   r“   r”   c                 ó¬   • U R                   " U4UUUS.UD6nUS   nUSS  n[        U R                  U R                  U R                  U5      n	U	4U-   nU$ rÈ   )rä   r   Úfeed_forward_chunkrâ   rã   )
rB   r’   rl   rn   r“   r}   Úself_attention_outputsrÊ   rŸ   Úlayer_outputs
             rE   r^   ÚLayoutLMLayer.forward7  s€   € ð "&§¢Øð"
à)ØØ/ñ	"
ð
 ñ"
Ðð 2°!Ñ4Ðà(¨¨Ð,ˆÜ0Ø×#Ñ# T×%AÑ%AÀ4×CSÑCSÐUeó
ˆð  / GÑ+ˆàˆrG   c                 óJ   • U R                  U5      nU R                  X!5      nU$ r¯   )rå   r»   )rB   rÊ   Úintermediate_outputrê   s       rE   rè   Ú LayoutLMLayer.feed_forward_chunkP  s)   € Ø"×/Ñ/Ð0@ÓAÐØ—{‘{Ð#6ÓIˆØÐrG   )rä   râ   rå   r»   rã   r¡   )r`   ra   rb   rc   r(   r>   r¢   r   r£   r¤   r¥   r^   rè   re   rf   rg   s   @rE   rà   rà   .  sy   ø† õ-ð 7;Ø15Ø,1ñà—|‘|ðð ! ×!2Ñ!2Ñ3ðð ˜E×-Ñ-Ñ.ð	ð
 $ D™>ðð 
ˆu|‰|Ñ	õ÷2ð rG   rà   c                   óä   ^ • \ rS rSrU 4S jr\     SS\R                  S\\R                     S\\R                     S\\
   S\\
   S\\
   S	\\\R                     \4   4S
 jj5       rSrU =r$ )ÚLayoutLMEncoderiW  c                 óÔ   >• [         TU ]  5         Xl        [        R                  " [        UR                  5       Vs/ sH  n[        U5      PM     sn5      U l        SU l	        g s  snf )NF)
r'   r(   rC   r   Ú
ModuleListÚrangeÚnum_hidden_layersrà   ÚlayerÚgradient_checkpointing)rB   rC   ÚirD   s      €rE   r(   ÚLayoutLMEncoder.__init__X  sR   ø€ Ü‰ÑÔØŒÜ—]’]Ä5È×IaÑIaÔCbÓ#cÑCb¸a¤M°&Ö$9ÑCbÑ#cÓdˆŒ
Ø&+ˆÕ#ùò $ds   ½A%r’   rl   rn   r“   Úoutput_hidden_statesÚreturn_dictr”   c           	      ó  • U(       a  SOS nU(       a  SOS n	[        U R                  5       H=  u  p«U(       a  X4-   nUb  X:   OS nU" SUUUUS.UD6nUS   nU(       d  M5  XS   4-   n	M?     U(       a  X4-   n[        UUU	S9$ )N© )r’   rl   rn   r“   r   r   )Úlast_hidden_stater’   Ú
attentions)Ú	enumeraterõ   r   )rB   r’   rl   rn   r“   rù   rú   r}   Úall_hidden_statesÚall_self_attentionsr÷   Úlayer_moduleÚlayer_head_maskÚlayer_outputss                 rE   r^   ÚLayoutLMEncoder.forward^  s¹   € ö #7™B¸DÐÞ$5™b¸4Ðä(¨¯©Ö4‰OˆAÞ#Ø$5Ð8HÑ$HÐ!à.7Ñ.C˜išlÈˆOá(ð Ø+Ø-Ø)Ø"3ñ	ð
 ñˆMð *¨!Ñ,ˆMß Ð Ø&9È1Ñ=MÐ<OÑ&OÒ#ñ!  5ö$  Ø 1Ð4DÑ DÐäØ+Ø+Ø*ñ
ð 	
rG   )rC   rö   rõ   )NNFFT)r`   ra   rb   rc   r(   r   r>   r¢   r   r£   r¤   r   r¥   r   r^   re   rf   rg   s   @rE   rð   rð   W  sª   ø† õ,ð ð 7;Ø15Ø,1Ø/4Ø&*ñ&
à—|‘|ð&
ð ! ×!2Ñ!2Ñ3ð&
ð ˜E×-Ñ-Ñ.ð	&
ð
 $ D™>ð&
ð ' t™nð&
ð ˜d‘^ð&
ð 
ˆuU—\‘\Ñ" OÐ3Ñ	4ô&
ó ö&
rG   rð   c                   ób   ^ • \ rS rSrU 4S jrS\R                  S\R                  4S jrSrU =r	$ )ÚLayoutLMPooleri‰  c                 ó¶   >• [         TU ]  5         [        R                  " UR                  UR                  5      U l        [        R                  " 5       U l        g r¯   )r'   r(   r   rŽ   r+   r«   ÚTanhÚ
activationrA   s     €rE   r(   ÚLayoutLMPooler.__init__Š  s9   ø€ Ü‰ÑÔÜ—Y’Y˜v×1Ñ1°6×3EÑ3EÓFˆŒ
ÜŸ'š'›)ˆrG   r’   r”   c                 ó\   • US S 2S4   nU R                  U5      nU R                  U5      nU$ )Nr   )r«   r
  )rB   r’   Úfirst_token_tensorÚpooled_outputs       rE   r^   ÚLayoutLMPooler.forward  s6   € ð +ª1¨a¨4Ñ0ÐØŸ
™
Ð#5Ó6ˆØŸ™¨Ó6ˆØÐrG   )r
  r«   rµ   rg   s   @rE   r  r  ‰  s(   ø† õ$ð
 U§\¡\ð °e·l±l÷ ò rG   r  c                   ób   ^ • \ rS rSrU 4S jrS\R                  S\R                  4S jrSrU =r	$ )ÚLayoutLMPredictionHeadTransformi™  c                 óp  >• [         TU ]  5         [        R                  " UR                  UR                  5      U l        [        UR                  [        5      (       a  [        UR                     U l
        OUR                  U l
        [        R                  " UR                  UR                  S9U l        g rª   )r'   r(   r   rŽ   r+   r«   rÐ   rÑ   rÒ   r   Útransform_act_fnr9   r8   rA   s     €rE   r(   Ú(LayoutLMPredictionHeadTransform.__init__š  s~   ø€ Ü‰ÑÔÜ—Y’Y˜v×1Ñ1°6×3EÑ3EÓFˆŒ
Üf×'Ñ'¬×-Ñ-Ü$*¨6×+<Ñ+<Ñ$=ˆDÕ!à$*×$5Ñ$5ˆDÔ!ÜŸš f×&8Ñ&8¸f×>SÑ>SÑTˆrG   r’   r”   c                 ól   • U R                  U5      nU R                  U5      nU R                  U5      nU$ r¯   )r«   r  r9   r×   s     rE   r^   Ú'LayoutLMPredictionHeadTransform.forward£  s4   € ØŸ
™
 =Ó1ˆØ×-Ñ-¨mÓ<ˆØŸ™ }Ó5ˆØÐrG   )r9   r«   r  rµ   rg   s   @rE   r  r  ™  s)   ø† õUð U§\¡\ð °e·l±l÷ ò rG   r  c                   ó4   ^ • \ rS rSrU 4S jrS rS rSrU =r$ )ÚLayoutLMLMPredictionHeadi«  c                 óH  >• [         TU ]  5         [        U5      U l        [        R
                  " UR                  UR                  SS9U l        [        R                  " [        R                  " UR                  5      5      U l        U R                  U R                  l        g )NF)Úbias)r'   r(   r  Ú	transformr   rŽ   r+   r*   ÚdecoderÚ	Parameterr>   rN   r  rA   s     €rE   r(   Ú!LayoutLMLMPredictionHead.__init__¬  sm   ø€ Ü‰ÑÔÜ8¸Ó@ˆŒô —y’y ×!3Ñ!3°V×5FÑ5FÈUÑSˆŒä—L’L¤§¢¨V×->Ñ->Ó!?Ó@ˆŒ	ð !ŸI™Iˆ‰ÕrG   c                 ó:   • U R                   U R                  l         g r¯   )r  r  ©rB   s    rE   Ú_tie_weightsÚ%LayoutLMLMPredictionHead._tie_weights¹  s   € Ø ŸI™Iˆ‰ÕrG   c                 óJ   • U R                  U5      nU R                  U5      nU$ r¯   )r  r  r×   s     rE   r^   Ú LayoutLMLMPredictionHead.forward¼  s$   € ØŸ™ }Ó5ˆØŸ™ ]Ó3ˆØÐrG   )r  r  r  )	r`   ra   rb   rc   r(   r!  r^   re   rf   rg   s   @rE   r  r  «  s   ø† õ&ò&÷ð rG   r  c                   ób   ^ • \ rS rSrU 4S jrS\R                  S\R                  4S jrSrU =r	$ )ÚLayoutLMOnlyMLMHeadiÃ  c                 óB   >• [         TU ]  5         [        U5      U l        g r¯   )r'   r(   r  ÚpredictionsrA   s     €rE   r(   ÚLayoutLMOnlyMLMHead.__init__Ä  s   ø€ Ü‰ÑÔÜ3°FÓ;ˆÕrG   Úsequence_outputr”   c                 ó(   • U R                  U5      nU$ r¯   ©r(  )rB   r*  Úprediction_scoress      rE   r^   ÚLayoutLMOnlyMLMHead.forwardÈ  s   € Ø ×,Ñ,¨_Ó=ÐØ Ð rG   r,  rµ   rg   s   @rE   r&  r&  Ã  s(   ø† õ<ð! u§|¡|ð !¸¿¹÷ !ò !rG   r&  c                   ó.   • \ rS rSr% \\S'   SrSrS rSr	g)ÚLayoutLMPreTrainedModeliÍ  rC   ÚlayoutlmTc                 óx  • [        U[        R                  5      (       ak  UR                  R                  R                  SU R                  R                  S9  UR                  b%  UR                  R                  R                  5         gg[        U[        R                  5      (       ax  UR                  R                  R                  SU R                  R                  S9  UR                  b2  UR                  R                  UR                     R                  5         gg[        U[        5      (       aJ  UR                  R                  R                  5         UR                  R                  R                  S5        g[        U[        5      (       a%  UR                  R                  R                  5         gg)zInitialize the weightsr—   )ÚmeanÚstdNç      ð?)rÐ   r   rŽ   ÚweightÚdataÚnormal_rC   Úinitializer_ranger  Úzero_r)   r!   r7   Úfill_r  )rB   rh   s     rE   Ú_init_weightsÚ%LayoutLMPreTrainedModel._init_weightsÓ  s0  € äfœbŸi™i×(Ñ(ð M‰M×Ñ×&Ñ&¨C°T·[±[×5RÑ5RÐ&ÑSØ{‰{Ñ&Ø—‘× Ñ ×&Ñ&Õ(ð 'ä˜¤§¡×-Ñ-ØM‰M×Ñ×&Ñ&¨C°T·[±[×5RÑ5RÐ&ÑSØ×!Ñ!Ñ-Ø—‘×"Ñ" 6×#5Ñ#5Ñ6×<Ñ<Õ>ð .ä˜Ô 1×2Ñ2ØK‰K×Ñ×"Ñ"Ô$ØM‰M×Ñ×$Ñ$ SÕ)Ü˜Ô 8×9Ñ9ØK‰K×Ñ×"Ñ"Õ$ð :rG   rü   N)
r`   ra   rb   rc   r   Ú__annotations__Úbase_model_prefixÚsupports_gradient_checkpointingr<  re   rü   rG   rE   r0  r0  Í  s   ‡ àÓØ"ÐØ&*Ð#õ%rG   r0  c                   ón  ^ • \ rS rSrU 4S jrS rS rS r\\	          SS\
\R                     S\
\R                     S\
\R                     S	\
\R                     S
\
\R                     S\
\R                     S\
\R                     S\
\   S\
\   S\
\   S\\\4   4S jj5       5       rSrU =r$ )ÚLayoutLMModeliæ  c                 ó°   >• [         TU ]  U5        Xl        [        U5      U l        [        U5      U l        [        U5      U l        U R                  5         g r¯   )
r'   r(   rC   r   r]   rð   Úencoderr  ÚpoolerÚ	post_initrA   s     €rE   r(   ÚLayoutLMModel.__init__è  sE   ø€ Ü‰Ñ˜Ô ØŒä,¨VÓ4ˆŒÜ& vÓ.ˆŒÜ$ VÓ,ˆŒð 	‰ÕrG   c                 ó.   • U R                   R                  $ r¯   ©r]   r-   r   s    rE   Úget_input_embeddingsÚ"LayoutLMModel.get_input_embeddingsó  s   € Ø‰×.Ñ.Ð.rG   c                 ó$   • XR                   l        g r¯   rI  )rB   rk   s     rE   Úset_input_embeddingsÚ"LayoutLMModel.set_input_embeddingsö  s   € Ø*/‰Õ'rG   c                 óš   • UR                  5        H7  u  p#U R                  R                  U   R                  R	                  U5        M9     g)z…
Prunes heads of the model. heads_to_prune: dict of {layer_num: list of heads to prune in this layer} See base
class PreTrainedModel
N)ÚitemsrD  rõ   rä   rÅ   )rB   Úheads_to_prunerõ   rÃ   s       rE   Ú_prune_headsÚLayoutLMModel._prune_headsù  s<   € ð
 +×0Ñ0Ö2‰LˆEØL‰L×Ñ˜uÑ%×/Ñ/×;Ñ;¸EÖBò 3rG   rQ   rR   rl   rS   r$   rn   rT   r“   rù   rú   r”   c           	      ó   • Ub  UOU R                   R                  nU	b  U	OU R                   R                  n	U
b  U
OU R                   R                  n
Ub  Ub  [	        S5      eUb"  U R                  X5        UR                  5       nO"Ub  UR                  5       SS nO[	        S5      eUb  UR                  OUR                  nUc  [        R                  " X¼S9nUc$  [        R                  " U[        R                  US9nUc'  [        R                  " US-   [        R                  US9nUR                  S5      R                  S	5      nUR                  U R                  S
9nSU-
  [        R                  " U R                  5      R                   -  nUbð  UR#                  5       S:X  ah  UR                  S5      R                  S5      R                  S5      R                  S5      nUR%                  U R                   R&                  SSSS5      nOCUR#                  5       S	:X  a/  UR                  S5      R                  S5      R                  S5      nUR                  [)        U R+                  5       5      R                  S
9nOS/U R                   R&                  -  nU R-                  UUUUUS9nU R/                  UUUUU	SS9nUS   nU R1                  U5      n[3        UUUR4                  UR6                  S9$ )a  
bbox (`torch.LongTensor` of shape `(batch_size, sequence_length, 4)`, *optional*):
    Bounding boxes of each input sequence tokens. Selected in the range `[0,
    config.max_2d_position_embeddings-1]`. Each bounding box should be a normalized version in (x0, y0, x1, y1)
    format, where (x0, y0) corresponds to the position of the upper left corner in the bounding box, and (x1,
    y1) represents the position of the lower right corner. See [Overview](#Overview) for normalization.

Examples:

```python
>>> from transformers import AutoTokenizer, LayoutLMModel
>>> import torch

>>> tokenizer = AutoTokenizer.from_pretrained("microsoft/layoutlm-base-uncased")
>>> model = LayoutLMModel.from_pretrained("microsoft/layoutlm-base-uncased")

>>> words = ["Hello", "world"]
>>> normalized_word_boxes = [637, 773, 693, 782], [698, 773, 733, 782]

>>> token_boxes = []
>>> for word, box in zip(words, normalized_word_boxes):
...     word_tokens = tokenizer.tokenize(word)
...     token_boxes.extend([box] * len(word_tokens))
>>> # add bounding boxes of cls + sep tokens
>>> token_boxes = [[0, 0, 0, 0]] + token_boxes + [[1000, 1000, 1000, 1000]]

>>> encoding = tokenizer(" ".join(words), return_tensors="pt")
>>> input_ids = encoding["input_ids"]
>>> attention_mask = encoding["attention_mask"]
>>> token_type_ids = encoding["token_type_ids"]
>>> bbox = torch.tensor([token_boxes])

>>> outputs = model(
...     input_ids=input_ids, bbox=bbox, attention_mask=attention_mask, token_type_ids=token_type_ids
... )

>>> last_hidden_states = outputs.last_hidden_state
```NzDYou cannot specify both input_ids and inputs_embeds at the same timer%   z5You have to specify either input_ids or inputs_embeds)rK   rI   )é   r   rL   )rJ   r5  r   )rQ   rR   r$   rS   rT   T)rn   r“   rù   rú   )rý   Úpooler_outputr’   rþ   )rC   r“   rù   Úuse_return_dictrŠ   Ú%warn_if_padding_and_no_attention_maskrM   rK   r>   ÚonesrN   rO   Ú	unsqueezerz   rJ   ÚfinfoÚminrq   r@   rô   ÚnextÚ
parametersr]   rD  rE  r   r’   rþ   )rB   rQ   rR   rl   rS   r$   rn   rT   r“   rù   rú   rU   rK   Úextended_attention_maskÚembedding_outputÚencoder_outputsr*  r  s                     rE   r^   ÚLayoutLMModel.forward  sÔ  € ðj 2CÑ1NÑ-ÐTX×T_ÑT_×TqÑTqÐà$8Ñ$DÑ È$Ï+É+×JjÑJjð 	ð &1Ñ%<‘kÀ$Ç+Á+×B]ÑB]ˆàÑ  ]Ñ%>ÜÐcÓdÐdØÑ"Ø×6Ñ6°yÔQØ#Ÿ.™.Ó*‰KØÑ&Ø'×,Ñ,Ó.¨s°Ð3‰KäÐTÓUÐUà%.Ñ%:×!Ò!À×@TÑ@TˆàÑ!Ü"ŸZšZ¨ÑCˆNØÑ!Ü"Ÿ[š[¨¼E¿J¹JÈvÑVˆNà‰<Ü—;’;˜{¨TÑ1¼¿¹ÈFÑSˆDà"0×":Ñ":¸1Ó"=×"GÑ"GÈÓ"JÐà"9×"<Ñ"<À4Ç:Á:Ð"<Ð"NÐØ#&Ð)@Ñ#@ÄEÇKÂKÐPT×PZÑPZÓD[×D_ÑD_Ñ"_ÐàÑ Ø}‰}‹ !Ó#Ø%×/Ñ/°Ó2×<Ñ<¸QÓ?×IÑIÈ"ÓM×WÑWÐXZÓ[	Ø%×,Ñ,¨T¯[©[×-JÑ-JÈBÐPRÐTVÐXZÓ[‘	Ø—‘“ AÓ%Ø%×/Ñ/°Ó2×<Ñ<¸RÓ@×JÑJÈ2ÓN	Ø!Ÿ™¬4°·±Ó0AÓ+B×+HÑ+H˜ÐI‰Ià˜ §¡×!>Ñ!>Ñ>ˆIàŸ?™?ØØØ%Ø)Ø'ð +ð 
Ðð Ÿ,™,ØØ#ØØ/Ø!5Øð 'ð 
ˆð *¨!Ñ,ˆØŸ™ OÓ4ˆä)Ø-Ø'Ø)×7Ñ7Ø&×1Ñ1ñ	
ð 	
rG   )rC   r]   rD  rE  )
NNNNNNNNNN)r`   ra   rb   rc   r(   rJ  rM  rR  r   r   r   r>   Ú
LongTensorr£   r¤   r   r¥   r   r^   re   rf   rg   s   @rE   rB  rB  æ  s1  ø† õ	ò/ò0òCð Øð 15Ø+/Ø6:Ø59Ø37Ø15Ø59Ø,0Ø/3Ø&*ñs
à˜E×,Ñ,Ñ-ðs
ð u×'Ñ'Ñ(ðs
ð ! ×!2Ñ!2Ñ3ð	s
ð
 ! ×!1Ñ!1Ñ2ðs
ð ˜u×/Ñ/Ñ0ðs
ð ˜E×-Ñ-Ñ.ðs
ð   × 1Ñ 1Ñ2ðs
ð $ D™>ðs
ð ' t™nðs
ð ˜d‘^ðs
ð 
ˆuÐ0Ð0Ñ	1ôs
ó ó ös
rG   rB  c                   ó–  ^ • \ rS rSrSS/rU 4S jrS rS rS r\	\
           SS\\R                     S	\\R                     S
\\R                     S\\R                     S\\R                     S\\R                     S\\R                     S\\R                     S\\   S\\   S\\   S\\\4   4S jj5       5       rSrU =r$ )ÚLayoutLMForMaskedLMiy  zcls.predictions.decoder.biaszcls.predictions.decoder.weightc                 ó„   >• [         TU ]  U5        [        U5      U l        [	        U5      U l        U R                  5         g r¯   )r'   r(   rB  r1  r&  ÚclsrF  rA   s     €rE   r(   ÚLayoutLMForMaskedLM.__init__}  s4   ø€ Ü‰Ñ˜Ô ä% fÓ-ˆŒÜ& vÓ.ˆŒð 	‰ÕrG   c                 óB   • U R                   R                  R                  $ r¯   ©r1  r]   r-   r   s    rE   rJ  Ú(LayoutLMForMaskedLM.get_input_embeddings†  ó   € Ø}‰}×'Ñ'×7Ñ7Ð7rG   c                 óB   • U R                   R                  R                  $ r¯   )rg  r(  r  r   s    rE   Úget_output_embeddingsÚ)LayoutLMForMaskedLM.get_output_embeddings‰  s   € Øx‰x×#Ñ#×+Ñ+Ð+rG   c                 ó‚   • XR                   R                  l        UR                  U R                   R                  l        g r¯   )rg  r(  r  r  )rB   Únew_embeddingss     rE   Úset_output_embeddingsÚ)LayoutLMForMaskedLM.set_output_embeddingsŒ  s*   € Ø'5‰×ÑÔ$Ø$2×$7Ñ$7ˆ‰×ÑÕ!rG   rQ   rR   rl   rS   r$   rn   rT   Úlabelsr“   rù   rú   r”   c                 ój  • Ub  UOU R                   R                  nU R                  UUUUUUUU	U
SS9
nUS   nU R                  U5      nSnUbF  [	        5       nU" UR                  SU R                   R                  5      UR                  S5      5      n[        UUUR                  UR                  S9$ )a  
bbox (`torch.LongTensor` of shape `(batch_size, sequence_length, 4)`, *optional*):
    Bounding boxes of each input sequence tokens. Selected in the range `[0,
    config.max_2d_position_embeddings-1]`. Each bounding box should be a normalized version in (x0, y0, x1, y1)
    format, where (x0, y0) corresponds to the position of the upper left corner in the bounding box, and (x1,
    y1) represents the position of the lower right corner. See [Overview](#Overview) for normalization.
labels (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):
    Labels for computing the masked language modeling loss. Indices should be in `[-100, 0, ...,
    config.vocab_size]` (see `input_ids` docstring) Tokens with indices set to `-100` are ignored (masked), the
    loss is only computed for the tokens with labels in `[0, ..., config.vocab_size]`

Examples:

```python
>>> from transformers import AutoTokenizer, LayoutLMForMaskedLM
>>> import torch

>>> tokenizer = AutoTokenizer.from_pretrained("microsoft/layoutlm-base-uncased")
>>> model = LayoutLMForMaskedLM.from_pretrained("microsoft/layoutlm-base-uncased")

>>> words = ["Hello", "[MASK]"]
>>> normalized_word_boxes = [637, 773, 693, 782], [698, 773, 733, 782]

>>> token_boxes = []
>>> for word, box in zip(words, normalized_word_boxes):
...     word_tokens = tokenizer.tokenize(word)
...     token_boxes.extend([box] * len(word_tokens))
>>> # add bounding boxes of cls + sep tokens
>>> token_boxes = [[0, 0, 0, 0]] + token_boxes + [[1000, 1000, 1000, 1000]]

>>> encoding = tokenizer(" ".join(words), return_tensors="pt")
>>> input_ids = encoding["input_ids"]
>>> attention_mask = encoding["attention_mask"]
>>> token_type_ids = encoding["token_type_ids"]
>>> bbox = torch.tensor([token_boxes])

>>> labels = tokenizer("Hello world", return_tensors="pt")["input_ids"]

>>> outputs = model(
...     input_ids=input_ids,
...     bbox=bbox,
...     attention_mask=attention_mask,
...     token_type_ids=token_type_ids,
...     labels=labels,
... )

>>> loss = outputs.loss
```NT)rl   rS   r$   rn   rT   r“   rù   rú   r   r%   ©ÚlossÚlogitsr’   rþ   )
rC   rW  r1  rg  r   r{   r*   r   r’   rþ   )rB   rQ   rR   rl   rS   r$   rn   rT   rt  r“   rù   rú   rŸ   r*  r-  Úmasked_lm_lossÚloss_fcts                    rE   r^   ÚLayoutLMForMaskedLM.forward  sÏ   € ð@ &1Ñ%<‘kÀ$Ç+Á+×B]ÑB]ˆà—-‘-ØØØ)Ø)Ø%ØØ'Ø/Ø!5Øð  ð 
ˆð " !™*ˆØ ŸH™H _Ó5ÐàˆØÑÜ'Ó)ˆHÙ%Ø!×&Ñ& r¨4¯;©;×+AÑ+AÓBØ—‘˜B“óˆNô
 ØØ$Ø!×/Ñ/Ø×)Ñ)ñ	
ð 	
rG   )rg  r1  ©NNNNNNNNNNN)r`   ra   rb   rc   Ú_tied_weights_keysr(   rJ  rn  rr  r   r   r   r>   rc  r£   r¤   r   r¥   r   r^   re   rf   rg   s   @rE   re  re  y  sT  ø† à8Ð:ZÐ[Ðõò8ò,ò8ð Øð 15Ø+/Ø6:Ø59Ø37Ø15Ø59Ø-1Ø,0Ø/3Ø&*ñ]
à˜E×,Ñ,Ñ-ð]
ð u×'Ñ'Ñ(ð]
ð ! ×!2Ñ!2Ñ3ð	]
ð
 ! ×!1Ñ!1Ñ2ð]
ð ˜u×/Ñ/Ñ0ð]
ð ˜E×-Ñ-Ñ.ð]
ð   × 1Ñ 1Ñ2ð]
ð ˜×)Ñ)Ñ*ð]
ð $ D™>ð]
ð ' t™nð]
ð ˜d‘^ð]
ð 
ˆunÐ$Ñ	%ô]
ó ó ö]
rG   re  zì
    LayoutLM Model with a sequence classification head on top (a linear layer on top of the pooled output) e.g. for
    document image classification tasks such as the [RVL-CDIP](https://www.cs.cmu.edu/~aharley/rvl-cdip/) dataset.
    )Úcustom_introc                   ó‚  ^ • \ rS rSrU 4S jrS r\\           SS\\	R                     S\\	R                     S\\	R                     S\\	R                     S\\	R                     S	\\	R                     S
\\	R                     S\\	R                     S\\   S\\   S\\   S\\\4   4S jj5       5       rSrU =r$ )Ú!LayoutLMForSequenceClassificationiò  c                 ó0  >• [         TU ]  U5        UR                  U l        [        U5      U l        [
        R                  " UR                  5      U l        [
        R                  " UR                  UR                  5      U l        U R                  5         g r¯   ©r'   r(   Ú
num_labelsrB  r1  r   r:   r;   r<   rŽ   r+   Ú
classifierrF  rA   s     €rE   r(   Ú*LayoutLMForSequenceClassification.__init__ù  ói   ø€ Ü‰Ñ˜Ô Ø ×+Ñ+ˆŒÜ% fÓ-ˆŒÜ—z’z &×"<Ñ"<Ó=ˆŒÜŸ)š) F×$6Ñ$6¸×8IÑ8IÓJˆŒð 	‰ÕrG   c                 óB   • U R                   R                  R                  $ r¯   rj  r   s    rE   rJ  Ú6LayoutLMForSequenceClassification.get_input_embeddings  rl  rG   rQ   rR   rl   rS   r$   rn   rT   rt  r“   rù   rú   r”   c                 ó  • Ub  UOU R                   R                  nU R                  UUUUUUUU	U
SS9
nUS   nU R                  U5      nU R	                  U5      nSnUGbŽ  U R                   R
                  c‘  U R                  S:X  a  SU R                   l        OoU R                  S:”  aN  UR                  [        R                  :X  d  UR                  [        R                  :X  a  SU R                   l        OSU R                   l        U R                   R
                  S:X  aI  [        5       nU R                  S:X  a&  U" UR                  5       UR                  5       5      nOŒU" Xè5      nOƒU R                   R
                  S:X  a=  [        5       nU" UR                  SU R                  5      UR                  S5      5      nO,U R                   R
                  S:X  a  [        5       nU" Xè5      n[!        UUUR"                  UR$                  S	9$ )
a
  
bbox (`torch.LongTensor` of shape `(batch_size, sequence_length, 4)`, *optional*):
    Bounding boxes of each input sequence tokens. Selected in the range `[0,
    config.max_2d_position_embeddings-1]`. Each bounding box should be a normalized version in (x0, y0, x1, y1)
    format, where (x0, y0) corresponds to the position of the upper left corner in the bounding box, and (x1,
    y1) represents the position of the lower right corner. See [Overview](#Overview) for normalization.
labels (`torch.LongTensor` of shape `(batch_size,)`, *optional*):
    Labels for computing the sequence classification/regression loss. Indices should be in `[0, ...,
    config.num_labels - 1]`. If `config.num_labels == 1` a regression loss is computed (Mean-Square loss), If
    `config.num_labels > 1` a classification loss is computed (Cross-Entropy).

Examples:

```python
>>> from transformers import AutoTokenizer, LayoutLMForSequenceClassification
>>> import torch

>>> tokenizer = AutoTokenizer.from_pretrained("microsoft/layoutlm-base-uncased")
>>> model = LayoutLMForSequenceClassification.from_pretrained("microsoft/layoutlm-base-uncased")

>>> words = ["Hello", "world"]
>>> normalized_word_boxes = [637, 773, 693, 782], [698, 773, 733, 782]

>>> token_boxes = []
>>> for word, box in zip(words, normalized_word_boxes):
...     word_tokens = tokenizer.tokenize(word)
...     token_boxes.extend([box] * len(word_tokens))
>>> # add bounding boxes of cls + sep tokens
>>> token_boxes = [[0, 0, 0, 0]] + token_boxes + [[1000, 1000, 1000, 1000]]

>>> encoding = tokenizer(" ".join(words), return_tensors="pt")
>>> input_ids = encoding["input_ids"]
>>> attention_mask = encoding["attention_mask"]
>>> token_type_ids = encoding["token_type_ids"]
>>> bbox = torch.tensor([token_boxes])
>>> sequence_label = torch.tensor([1])

>>> outputs = model(
...     input_ids=input_ids,
...     bbox=bbox,
...     attention_mask=attention_mask,
...     token_type_ids=token_type_ids,
...     labels=sequence_label,
... )

>>> loss = outputs.loss
>>> logits = outputs.logits
```NT©
rQ   rR   rl   rS   r$   rn   rT   r“   rù   rú   r   Ú
regressionÚsingle_label_classificationÚmulti_label_classificationr%   rv  )rC   rW  r1  r<   r„  Úproblem_typerƒ  rJ   r>   rO   r‹   r	   Úsqueezer   r{   r   r   r’   rþ   )rB   rQ   rR   rl   rS   r$   rn   rT   rt  r“   rù   rú   rŸ   r  rx  rw  rz  s                    rE   r^   Ú)LayoutLMForSequenceClassification.forward  s¼  € ð@ &1Ñ%<‘kÀ$Ç+Á+×B]ÑB]ˆà—-‘-ØØØ)Ø)Ø%ØØ'Ø/Ø!5Øð  ð 
ˆð   ™
ˆàŸ™ ]Ó3ˆØ—‘ Ó/ˆàˆØÒØ{‰{×'Ñ'Ñ/Ø—?‘? aÓ'Ø/;D—K‘KÕ,Ø—_‘_ qÓ(¨f¯l©l¼e¿j¹jÓ.HÈFÏLÉLÔ\a×\eÑ\eÓLeØ/LD—K‘KÕ,à/KD—K‘KÔ,à{‰{×'Ñ'¨<Ó7Ü"›9Ø—?‘? aÓ'Ù# F§N¡NÓ$4°f·n±nÓ6FÓG‘Dá# FÓ3‘DØ—‘×)Ñ)Ð-JÓJÜ+Ó-Ù §¡¨B°·±Ó @À&Ç+Á+ÈbÃ/ÓR‘Ø—‘×)Ñ)Ð-IÓIÜ,Ó.Ù Ó/ä'ØØØ!×/Ñ/Ø×)Ñ)ñ	
ð 	
rG   ©r„  r<   r1  rƒ  r|  )r`   ra   rb   rc   r(   rJ  r   r   r   r>   rc  r£   r¤   r   r¥   r   r^   re   rf   rg   s   @rE   r€  r€  ò  s?  ø† õò8ð Øð 15Ø+/Ø6:Ø59Ø37Ø15Ø59Ø-1Ø,0Ø/3Ø&*ñn
à˜E×,Ñ,Ñ-ðn
ð u×'Ñ'Ñ(ðn
ð ! ×!2Ñ!2Ñ3ð	n
ð
 ! ×!1Ñ!1Ñ2ðn
ð ˜u×/Ñ/Ñ0ðn
ð ˜E×-Ñ-Ñ.ðn
ð   × 1Ñ 1Ñ2ðn
ð ˜×)Ñ)Ñ*ðn
ð $ D™>ðn
ð ' t™nðn
ð ˜d‘^ðn
ð 
ˆuÐ.Ð.Ñ	/ôn
ó ó ön
rG   r€  a3  
    LayoutLM Model with a token classification head on top (a linear layer on top of the hidden-states output) e.g. for
    sequence labeling (information extraction) tasks such as the [FUNSD](https://guillaumejaume.github.io/FUNSD/)
    dataset and the [SROIE](https://rrc.cvc.uab.es/?ch=13) dataset.
    c                   ó‚  ^ • \ rS rSrU 4S jrS r\\           SS\\	R                     S\\	R                     S\\	R                     S\\	R                     S\\	R                     S	\\	R                     S
\\	R                     S\\	R                     S\\   S\\   S\\   S\\\4   4S jj5       5       rSrU =r$ )ÚLayoutLMForTokenClassificationiy  c                 ó0  >• [         TU ]  U5        UR                  U l        [        U5      U l        [
        R                  " UR                  5      U l        [
        R                  " UR                  UR                  5      U l        U R                  5         g r¯   r‚  rA   s     €rE   r(   Ú'LayoutLMForTokenClassification.__init__  r†  rG   c                 óB   • U R                   R                  R                  $ r¯   rj  r   s    rE   rJ  Ú3LayoutLMForTokenClassification.get_input_embeddings‹  rl  rG   rQ   rR   rl   rS   r$   rn   rT   rt  r“   rù   rú   r”   c                 óx  • Ub  UOU R                   R                  nU R                  UUUUUUUU	U
SS9
nUS   nU R                  U5      nU R	                  U5      nSnUb<  [        5       nU" UR                  SU R                  5      UR                  S5      5      n[        UUUR                  UR                  S9$ )a‡  
bbox (`torch.LongTensor` of shape `(batch_size, sequence_length, 4)`, *optional*):
    Bounding boxes of each input sequence tokens. Selected in the range `[0,
    config.max_2d_position_embeddings-1]`. Each bounding box should be a normalized version in (x0, y0, x1, y1)
    format, where (x0, y0) corresponds to the position of the upper left corner in the bounding box, and (x1,
    y1) represents the position of the lower right corner. See [Overview](#Overview) for normalization.
labels (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):
    Labels for computing the token classification loss. Indices should be in `[0, ..., config.num_labels - 1]`.

Examples:

```python
>>> from transformers import AutoTokenizer, LayoutLMForTokenClassification
>>> import torch

>>> tokenizer = AutoTokenizer.from_pretrained("microsoft/layoutlm-base-uncased")
>>> model = LayoutLMForTokenClassification.from_pretrained("microsoft/layoutlm-base-uncased")

>>> words = ["Hello", "world"]
>>> normalized_word_boxes = [637, 773, 693, 782], [698, 773, 733, 782]

>>> token_boxes = []
>>> for word, box in zip(words, normalized_word_boxes):
...     word_tokens = tokenizer.tokenize(word)
...     token_boxes.extend([box] * len(word_tokens))
>>> # add bounding boxes of cls + sep tokens
>>> token_boxes = [[0, 0, 0, 0]] + token_boxes + [[1000, 1000, 1000, 1000]]

>>> encoding = tokenizer(" ".join(words), return_tensors="pt")
>>> input_ids = encoding["input_ids"]
>>> attention_mask = encoding["attention_mask"]
>>> token_type_ids = encoding["token_type_ids"]
>>> bbox = torch.tensor([token_boxes])
>>> token_labels = torch.tensor([1, 1, 0, 0]).unsqueeze(0)  # batch size of 1

>>> outputs = model(
...     input_ids=input_ids,
...     bbox=bbox,
...     attention_mask=attention_mask,
...     token_type_ids=token_type_ids,
...     labels=token_labels,
... )

>>> loss = outputs.loss
>>> logits = outputs.logits
```NTrŠ  r   r%   rv  )rC   rW  r1  r<   r„  r   r{   rƒ  r   r’   rþ   )rB   rQ   rR   rl   rS   r$   rn   rT   rt  r“   rù   rú   rŸ   r*  rx  rw  rz  s                    rE   r^   Ú&LayoutLMForTokenClassification.forwardŽ  sÎ   € ð| &1Ñ%<‘kÀ$Ç+Á+×B]ÑB]ˆà—-‘-ØØØ)Ø)Ø%ØØ'Ø/Ø!5Øð  ð 
ˆð " !™*ˆàŸ,™, Ó7ˆØ—‘ Ó1ˆàˆØÑÜ'Ó)ˆHÙ˜FŸK™K¨¨D¯O©OÓ<¸f¿k¹kÈ"»oÓNˆDä$ØØØ!×/Ñ/Ø×)Ñ)ñ	
ð 	
rG   r‘  r|  )r`   ra   rb   rc   r(   rJ  r   r   r   r>   rc  r£   r¤   r   r¥   r   r^   re   rf   rg   s   @rE   r“  r“  y  s?  ø† õò8ð Øð 15Ø+/Ø6:Ø59Ø37Ø15Ø59Ø-1Ø,0Ø/3Ø&*ñZ
à˜E×,Ñ,Ñ-ðZ
ð u×'Ñ'Ñ(ðZ
ð ! ×!2Ñ!2Ñ3ð	Z
ð
 ! ×!1Ñ!1Ñ2ðZ
ð ˜u×/Ñ/Ñ0ðZ
ð ˜E×-Ñ-Ñ.ðZ
ð   × 1Ñ 1Ñ2ðZ
ð ˜×)Ñ)Ñ*ðZ
ð $ D™>ðZ
ð ' t™nðZ
ð ˜d‘^ðZ
ð 
ˆuÐ+Ð+Ñ	,ôZ
ó ó öZ
rG   r“  c                   ó¦  ^ • \ rS rSrSU 4S jjrS r\\            SS\\	R                     S\\	R                     S\\	R                     S\\	R                     S\\	R                     S	\\	R                     S
\\	R                     S\\	R                     S\\	R                     S\\   S\\   S\\   S\\\4   4S jj5       5       rSrU =r$ )ÚLayoutLMForQuestionAnsweringií  c                 óæ   >• [         TU ]  U5        UR                  U l        [        U5      U l        [
        R                  " UR                  UR                  5      U l        U R                  5         g)z}
has_visual_segment_embedding (`bool`, *optional*, defaults to `True`):
    Whether or not to add visual segment embeddings.
N)
r'   r(   rƒ  rB  r1  r   rŽ   r+   Ú
qa_outputsrF  )rB   rC   Úhas_visual_segment_embeddingrD   s      €rE   r(   Ú%LayoutLMForQuestionAnswering.__init__ï  sU   ø€ ô
 	‰Ñ˜Ô Ø ×+Ñ+ˆŒä% fÓ-ˆŒÜŸ)š) F×$6Ñ$6¸×8IÑ8IÓJˆŒð 	‰ÕrG   c                 óB   • U R                   R                  R                  $ r¯   rj  r   s    rE   rJ  Ú1LayoutLMForQuestionAnswering.get_input_embeddingsý  rl  rG   rQ   rR   rl   rS   r$   rn   rT   Ústart_positionsÚend_positionsr“   rù   rú   r”   c                 óð  • Ub  UOU R                   R                  nU R                  UUUUUUUU
USS9
nUS   nU R                  U5      nUR	                  SSS9u  nnUR                  S5      R                  5       nUR                  S5      R                  5       nSnUb·  U	b´  [        UR                  5       5      S:”  a  UR                  S5      n[        U	R                  5       5      S:”  a  U	R                  S5      n	UR                  S5      nUR                  SU5      nU	R                  SU5      n	[        US9nU" UU5      nU" UU	5      nUU-   S	-  n[        UUUUR                  UR                  S
9$ )aô  
bbox (`torch.LongTensor` of shape `(batch_size, sequence_length, 4)`, *optional*):
    Bounding boxes of each input sequence tokens. Selected in the range `[0,
    config.max_2d_position_embeddings-1]`. Each bounding box should be a normalized version in (x0, y0, x1, y1)
    format, where (x0, y0) corresponds to the position of the upper left corner in the bounding box, and (x1,
    y1) represents the position of the lower right corner. See [Overview](#Overview) for normalization.

Example:

In the example below, we prepare a question + context pair for the LayoutLM model. It will give us a prediction
of what it thinks the answer is (the span of the answer within the texts parsed from the image).

```python
>>> from transformers import AutoTokenizer, LayoutLMForQuestionAnswering
>>> from datasets import load_dataset
>>> import torch

>>> tokenizer = AutoTokenizer.from_pretrained("impira/layoutlm-document-qa", add_prefix_space=True)
>>> model = LayoutLMForQuestionAnswering.from_pretrained("impira/layoutlm-document-qa", revision="1e3ebac")

>>> dataset = load_dataset("nielsr/funsd", split="train")
>>> example = dataset[0]
>>> question = "what's his name?"
>>> words = example["words"]
>>> boxes = example["bboxes"]

>>> encoding = tokenizer(
...     question.split(), words, is_split_into_words=True, return_token_type_ids=True, return_tensors="pt"
... )
>>> bbox = []
>>> for i, s, w in zip(encoding.input_ids[0], encoding.sequence_ids(0), encoding.word_ids(0)):
...     if s == 1:
...         bbox.append(boxes[w])
...     elif i == tokenizer.sep_token_id:
...         bbox.append([1000] * 4)
...     else:
...         bbox.append([0] * 4)
>>> encoding["bbox"] = torch.tensor([bbox])

>>> word_ids = encoding.word_ids(0)
>>> outputs = model(**encoding)
>>> loss = outputs.loss
>>> start_scores = outputs.start_logits
>>> end_scores = outputs.end_logits
>>> start, end = word_ids[start_scores.argmax(-1)], word_ids[end_scores.argmax(-1)]
>>> print(" ".join(words[start : end + 1]))
M. Hamann P. Harper, P. Martinez
```NTrŠ  r   r   r%   rÀ   )Úignore_indexrL   )rw  Ústart_logitsÚ
end_logitsr’   rþ   )rC   rW  r1  r  Úsplitr  r|   rÁ   rM   Úclampr   r   r’   rþ   )rB   rQ   rR   rl   rS   r$   rn   rT   r¢  r£  r“   rù   rú   rŸ   r*  rx  r¦  r§  Ú
total_lossÚignored_indexrz  Ú
start_lossÚend_losss                          rE   r^   Ú$LayoutLMForQuestionAnswering.forward   s—  € ðD &1Ñ%<‘kÀ$Ç+Á+×B]ÑB]ˆà—-‘-ØØØ)Ø)Ø%ØØ'Ø/Ø!5Øð  ð 
ˆð " !™*ˆà—‘ Ó1ˆØ#)§<¡<°°r <Ð#:Ñ ˆjØ#×+Ñ+¨BÓ/×:Ñ:Ó<ˆØ×'Ñ'¨Ó+×6Ñ6Ó8ˆ
àˆ
ØÑ&¨=Ñ+Dä?×'Ñ'Ó)Ó*¨QÓ.Ø"1×"9Ñ"9¸"Ó"=Ü=×%Ñ%Ó'Ó(¨1Ó,Ø -× 5Ñ 5°bÓ 9à(×-Ñ-¨aÓ0ˆMØ-×3Ñ3°A°}ÓEˆOØ)×/Ñ/°°=ÓAˆMä'°]ÑCˆHÙ! ,°Ó@ˆJÙ 
¨MÓ:ˆHØ$ xÑ/°1Ñ4ˆJä+ØØ%Ø!Ø!×/Ñ/Ø×)Ñ)ñ
ð 	
rG   )r1  rƒ  r  )T)NNNNNNNNNNNN)r`   ra   rb   rc   r(   rJ  r   r   r   r>   rc  r£   r¤   r   r¥   r   r^   re   rf   rg   s   @rE   r›  r›  í  sX  ø† ÷ò8ð Øð 15Ø+/Ø6:Ø59Ø37Ø15Ø59Ø6:Ø48Ø,0Ø/3Ø&*ñm
à˜E×,Ñ,Ñ-ðm
ð u×'Ñ'Ñ(ðm
ð ! ×!2Ñ!2Ñ3ð	m
ð
 ! ×!1Ñ!1Ñ2ðm
ð ˜u×/Ñ/Ñ0ðm
ð ˜E×-Ñ-Ñ.ðm
ð   × 1Ñ 1Ñ2ðm
ð " %×"2Ñ"2Ñ3ðm
ð   × 0Ñ 0Ñ1ðm
ð $ D™>ðm
ð ' t™nðm
ð ˜d‘^ðm
ð 
ˆuÐ2Ð2Ñ	3ôm
ó ó öm
rG   r›  )re  r€  r“  r›  rB  r0  )r—   N)@rd   Útypingr   r   r   r>   Útorch.utils.checkpointr   Útorch.nnr   r   r	   Úactivationsr   Úmodeling_layersr   Úmodeling_outputsr   r   r   r   r   r   Úmodeling_utilsr   r   Úpytorch_utilsr   r   r   Úutilsr   r   r   Úconfiguration_layoutlmr   Ú
get_loggerr`   Úloggerr9   r7   ÚModuler   r¢   Úfloatr   rƒ   r§   r¸   rÍ   rÚ   rà   rð   r  r  r  r&  r0  rB  re  r€  r“  r›  Ú__all__rü   rG   rE   Ú<module>r¾     sw  ðñ ç ,Ñ ,ã Û Ý ß AÑ Aå !Ý 9÷÷ ÷ Gß lÑ lß >Ñ >Ý 2ð 
×	Ò	˜HÓ	%€ð —L‘LÐ ôI˜Ÿ™ô Iðh Ø(,ñ%ØI‰Ið%à<‰<ð%ð 
‰ð%ð <‰<ð	%ð
 ˜UŸ\™\Ñ*ð%ð ð%ð ð%ð ˜Ÿ™Ñ%õ%ô87˜BŸI™Iô 7ôv˜Ÿ™ô ô*˜Ÿ	™	ô *ô\˜2Ÿ9™9ô ô R—Y‘Yô ô%Ð.ô %ôR.
b—i‘iô .
ôdR—Y‘Yô ô  b§i¡iô ô$˜rŸy™yô ô0!˜"Ÿ)™)ô !ð ô%˜oó %ó ð%ð0 ôO
Ð+ó O
ó ðO
ðd ôu
Ð1ó u
ó ðu
ñp ðñô~
Ð(?ó ~
óð~
ñB ðñôj
Ð%<ó j
óðj
ðZ ôA
Ð#:ó A
ó ðA
òHrG   