
"""PyTorch LUKE model."""

import math
from dataclasses import dataclass
from typing import Optional, Union

import torch
import torch.utils.checkpoint
from torch import nn
from torch.nn import BCEWithLogitsLoss, CrossEntropyLoss, MSELoss

from ...activations import ACT2FN, gelu
from ...modeling_layers import GradientCheckpointingLayer
from ...modeling_outputs import BaseModelOutput, BaseModelOutputWithPooling
from ...modeling_utils import PreTrainedModel
from ...pytorch_utils import apply_chunking_to_forward
from ...utils import ModelOutput, auto_docstring, logging
from .configuration_luke import LukeConfig


logger = logging.get_logger(__name__)


@dataclass
@auto_docstring(
    custom_intro="""
    Base class for outputs of the LUKE model.
    """
)
class BaseLukeModelOutputWithPooling(BaseModelOutputWithPooling):
    r"""
    pooler_output (`torch.FloatTensor` of shape `(batch_size, hidden_size)`):
        Last layer hidden-state of the first token of the sequence (classification token) further processed by a
        Linear layer and a Tanh activation function.
    entity_last_hidden_state (`torch.FloatTensor` of shape `(batch_size, entity_length, hidden_size)`):
        Sequence of entity hidden-states at the output of the last layer of the model.
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """
Nentity_last_hidden_state.entity_hidden_states __name__
__module____qualname____firstlineno____doc__r   r   torchFloatTensor__annotations__r   tuple__static_attributes__r       ^/var/www/html/shao/venv/lib/python3.13/site-packages/transformers/models/luke/modeling_luke.pyr   r   &   s@    
 =Ahu'8'89@DH(5):):C)?#@AHr)   r   zV
    Base class for model's outputs, with potential hidden states and attentions.
    c                   t    \ rS rSr% SrSr\\R                     \	S'   Sr
\\\R                  S4      \	S'   Srg)BaseLukeModelOutput=   ah  
entity_last_hidden_state (`torch.FloatTensor` of shape `(batch_size, entity_length, hidden_size)`):
    Sequence of entity hidden-states at the output of the last layer of the model.
entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
    Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
    shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
    layer plus the initial entity embedding outputs.

    entity_last_hidden_state: Optional[torch.FloatTensor] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring
class LukeMaskedLMOutput(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        The sum of masked language modeling (MLM) loss and entity prediction loss.
    mlm_loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        Masked language modeling (MLM) loss.
    mep_loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        Masked entity prediction (MEP) loss.
    logits (`torch.FloatTensor` of shape `(batch_size, sequence_length, config.vocab_size)`):
        Prediction scores of the language modeling head (scores for each vocabulary token before SoftMax).
    entity_logits (`torch.FloatTensor` of shape `(batch_size, sequence_length, config.entity_vocab_size)`):
        Prediction scores of the entity prediction head (scores for each entity vocabulary token before SoftMax).
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """
Nlossmlm_lossmep_losslogitsentity_logitshidden_states.r   
attentionsr   )r   r    r!   r"   r#   r1   r   r$   r%   r&   r2   r3   r4   r5   r6   r'   r   r7   r(   r   r)   r*   r/   r/   Q   s    " )-D(5$$
%,,0Hhu(()0,0Hhu(()0*.FHU&&'.15M8E--.58<M8E%"3"345<DH(5):):C)?#@AH:>Ju00#567>r)   r/   z2
    Outputs of entity classification models.
    c                       \ rS rSr% SrSr\\R                     \	S'   Sr
\\R                     \	S'   Sr\\\R                  S4      \	S'   Sr\\\R                  S4      \	S'   Sr\\\R                  S4      \	S	'   S
rg)EntityClassificationOutputs     
loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
    Classification loss.
logits (`torch.FloatTensor` of shape `(batch_size, config.num_labels)`):
    Classification scores (before SoftMax).
entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
    Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
    shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
    layer plus the initial entity embedding outputs.

    loss: Optional[torch.FloatTensor] = None
    logits: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring(
    custom_intro="""
    Outputs of entity pair classification models.
    """
)
class EntityPairClassificationOutput(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        Classification loss.
    logits (`torch.FloatTensor` of shape `(batch_size, config.num_labels)`):
        Classification scores (before SoftMax).
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """

    loss: Optional[torch.FloatTensor] = None
    logits: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring(
    custom_intro="""
    Outputs of entity span classification models.
    """
)
class EntitySpanClassificationOutput(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        Classification loss.
    logits (`torch.FloatTensor` of shape `(batch_size, entity_length, config.num_labels)`):
        Classification scores (before SoftMax).
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """

    loss: Optional[torch.FloatTensor] = None
    logits: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring(
    custom_intro="""
    Outputs of sentence classification models.
    """
)
class LukeSequenceClassifierOutput(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        Classification (or regression if config.num_labels==1) loss.
    logits (`torch.FloatTensor` of shape `(batch_size, config.num_labels)`):
        Classification (or regression if config.num_labels==1) scores (before SoftMax).
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """

    loss: Optional[torch.FloatTensor] = None
    logits: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring(
    custom_intro="""
    Base class for outputs of token classification models.
    """
)
class LukeTokenClassifierOutput(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        Classification loss.
    logits (`torch.FloatTensor` of shape `(batch_size, sequence_length, config.num_labels)`):
        Classification scores (before SoftMax).
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """

    loss: Optional[torch.FloatTensor] = None
    logits: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring(
    custom_intro="""
    Outputs of question answering models.
    """
)
class LukeQuestionAnsweringModelOutput(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `labels` is provided):
        Total span extraction loss is the sum of a Cross-Entropy for the start and end positions.
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """

    loss: Optional[torch.FloatTensor] = None
    start_logits: Optional[torch.FloatTensor] = None
    end_logits: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring(
    custom_intro="""
    Outputs of multiple choice models.
    """
)
class LukeMultipleChoiceModelOutput(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape *(1,)*, *optional*, returned when `labels` is provided):
        Classification loss.
    logits (`torch.FloatTensor` of shape `(batch_size, num_choices)`):
        *num_choices* is the second dimension of the input tensors. (see *input_ids* above).

        Classification scores (before SoftMax).
    entity_hidden_states (`tuple(torch.FloatTensor)`, *optional*, returned when `output_hidden_states=True` is passed or when `config.output_hidden_states=True`):
        Tuple of `torch.FloatTensor` (one for the output of the embeddings + one for the output of each layer) of
        shape `(batch_size, entity_length, hidden_size)`. Entity hidden-states of the model at the output of each
        layer plus the initial entity embedding outputs.
    """

    loss: Optional[torch.FloatTensor] = None
    logits: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    entity_hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


class LukeEmbeddings(nn.Module):
    """
    Same as BertEmbeddings with a tiny tweak for positional embeddings indexing.
    """

    def __init__(self, config):
        super().__init__()
        self.word_embeddings = nn.Embedding(config.vocab_size, config.hidden_size, padding_idx=config.pad_token_id)
        self.position_embeddings = nn.Embedding(config.max_position_embeddings, config.hidden_size)
        self.token_type_embeddings = nn.Embedding(config.type_vocab_size, config.hidden_size)

        self.LayerNorm = nn.LayerNorm(config.hidden_size, eps=config.layer_norm_eps)
        self.dropout = nn.Dropout(config.hidden_dropout_prob)

        self.padding_idx = config.pad_token_id
        self.position_embeddings = nn.Embedding(
            config.max_position_embeddings, config.hidden_size, padding_idx=self.padding_idx
        )

    def forward(
        self,
        input_ids=None,
        token_type_ids=None,
        position_ids=None,
        inputs_embeds=None,
    ):
        if position_ids is None:
            if input_ids is not None:
                # Create the position ids from the input token ids. Any padded tokens remain padded.
                position_ids = create_position_ids_from_input_ids(input_ids, self.padding_idx).to(input_ids.device)
            else:
                position_ids = self.create_position_ids_from_inputs_embeds(inputs_embeds)

        if input_ids is not None:
            input_shape = input_ids.size()
        else:
            input_shape = inputs_embeds.size()[:-1]

        if token_type_ids is None:
            token_type_ids = torch.zeros(input_shape, dtype=torch.long, device=position_ids.device)

        if inputs_embeds is None:
            inputs_embeds = self.word_embeddings(input_ids)

        position_embeddings = self.position_embeddings(position_ids)
        token_type_embeddings = self.token_type_embeddings(token_type_ids)

        embeddings = inputs_embeds + position_embeddings + token_type_embeddings
        embeddings = self.LayerNorm(embeddings)
        embeddings = self.dropout(embeddings)
        return embeddings

    def create_position_ids_from_inputs_embeds(self, inputs_embeds):
        """
        We are provided embeddings directly. We cannot infer which are padded so just generate sequential position ids.

        Args:
            inputs_embeds: torch.Tensor

        Returns: torch.Tensor
        """
        input_shape = inputs_embeds.size()[:-1]
        sequence_length = input_shape[1]

        position_ids = torch.arange(
            self.padding_idx + 1, sequence_length + self.padding_idx + 1, dtype=torch.long, device=inputs_embeds.device
        )
        return position_ids.unsqueeze(0).expand(input_shape)
U =r$ )
LukeEntityEmbeddingsil  rj   c                   > [         TU ]  5         Xl        [        R                  " UR
                  UR                  SS9U l        UR                  UR                  :w  a/  [        R                  " UR                  UR                  SS9U l
        [        R                  " UR                  UR                  5      U l        [        R                  " UR                  UR                  5      U l        [        R                  " UR                  UR                   S9U l        [        R"                  " UR$                  5      U l        g )Nr   rT   FbiasrV   )rX   rY   rj   r   rZ   entity_vocab_sizeentity_emb_sizeentity_embeddingsr\   Linearentity_embedding_denser_   r`   ra   rb   rc   rd   re   rf   rg   rh   s     r*   rY   LukeEntityEmbeddings.__init__m  s    !#f.F.FH^H^lm!n!!V%7%77*,))F4J4JFL^L^ej*kD'#%<<0N0NPVPbPb#c %'\\&2H2H&J\J\%]"f&8&8f>S>STzz&"<"<=r)   
entity_idsrx   rz   c                 <   Uc  [         R                  " U5      nU R                  U5      nU R                  R                  U R                  R
                  :w  a  U R                  U5      nU R                  UR                  SS95      nUS:g  R                  U5      R                  S5      nXV-  n[         R                  " USS9nXVR                  SS9R                  SS9-  nU R                  U5      nXE-   U-   nU R                  U5      nU R                  U5      nU$ )Nr   )minrn   dimgHz>)r$   
zeros_liker   rj   r   r\   r   r`   clamptype_asr   sumrb   rc   rg   )	ri   r   rx   rz   r   r`   position_embedding_maskrb   r}   s	            r*   r~   LukeEntityEmbeddings.forward{  s    !"--j9N 22:>;;&&$++*A*AA $ ; ;<M N"66|7I7Ia7I7PQ#/2#5">">?R"S"]"]^`"a1K#ii(;D14O4OTV4O4W4]4]bf4]4gg $ : :> J&<?TT
^^J/
\\*-
r)   )rc   rj   rg   r   r   r`   rb   N)r   r    r!   r"   r   rY   r$   
LongTensorr   r~   r(   r   r   s   @r*   r   r   l  sQ    >z >$ 6:	$$ && !!1!12	 r)   r   c                   >   ^  \ rS rSrU 4S jrS r   SS jrSrU =r$ )LukeSelfAttentioni  c                 D  > [         TU ]  5         UR                  UR                  -  S:w  a7  [	        US5      (       d&  [        SUR                   SUR                   S35      eUR                  U l        [        UR                  UR                  -  5      U l        U R                  U R                  -  U l        UR                  U l	        [        R                  " UR                  U R                  5      U l        [        R                  " UR                  U R                  5      U l        [        R                  " UR                  U R                  5      U l        U R                  (       a  [        R                  " UR                  U R                  5      U l        [        R                  " UR                  U R                  5      U l        [        R                  " UR                  U R                  5      U l        [        R$                  " UR&                  5      U l        g )Nr   embedding_sizezThe hidden size z4 is not a multiple of the number of attention heads .)rX   rY   r\   num_attention_headshasattr
ValueErrorintattention_head_sizeall_head_sizeuse_entity_aware_attentionr   r   querykeyvalue	w2e_query	e2w_query	e2e_queryre   attention_probs_dropout_probrg   rh   s     r*   rY   LukeSelfAttention.__init__  s    : ::a?PVXhHiHi"6#5#5"6 7334A7 
 $*#=#= #&v'9'9F<V<V'V#W !558P8PP*0*K*K'YYv1143E3EF
99V//1C1CDYYv1143E3EF
**YYv'9'94;M;MNDNYYv'9'94;M;MNDNYYv'9'94;M;MNDNzz&"E"EFr)   c                     UR                  5       S S U R                  U R                  4-   nUR                  " U6 nUR	                  SSSS5      $ )Nrn   r      r   r
   )ru   r   r   viewpermute)ri   xnew_x_shapes      r*   transpose_for_scores&LukeSelfAttention.transpose_for_scores  sL    ffhsmt'?'?AYAY&ZZFFK yyAq!$$r)   c                    UR                  S5      nUc  UnO[        R                  " X/SS9nU R                  U R	                  U5      5      nU R                  U R                  U5      5      n	U R                  (       Ga  UGb  U R                  U R                  U5      5      n
U R                  U R                  U5      5      nU R                  U R                  U5      5      nU R                  U R                  U5      5      nUS S 2S S 2S U2S S 24   nUS S 2S S 2S U2S S 24   nUS S 2S S 2US 2S S 24   nUS S 2S S 2US 2S S 24   n[        R                  " XR                  SS5      5      n[        R                  " UUR                  SS5      5      n[        R                  " XR                  SS5      5      n[        R                  " UUR                  SS5      5      n[        R                  " UU/SS9n[        R                  " UU/SS9n[        R                  " UU/SS9nOGU R                  U R                  U5      5      n[        R                  " UUR                  SS5      5      nU[        R                  " U R                  5      -  nUb  UU-   n[         R"                  R%                  USS9nU R'                  U5      nUb  UU-  n[        R                  " UU	5      nUR)                  SSSS5      R+                  5       nUR                  5       S S U R,                  4-   nUR.                  " U6 nUS S 2S U2S S 24   nUc  S nOUS S 2US 2S S 24   nU(       a  UUU4nU$ UU4nU$ )Nr   r   rn   r   r
   r   r   )ru   r$   catr   r   r   r   r   r   r   r   matmul	transposemathsqrtr   r   
functionalsoftmaxrg   r   
contiguousr   r   ) ri   word_hidden_statesr   attention_mask	head_maskoutput_attentions	word_sizeconcat_hidden_states	key_layervalue_layerw2w_query_layerw2e_query_layere2w_query_layere2e_query_layerw2w_key_layere2w_key_layerw2e_key_layere2e_key_layerw2w_attention_scoresw2e_attention_scorese2w_attention_scorese2e_attention_scoresword_attention_scoresentity_attention_scoresattention_scoresquery_layerattention_probscontext_layernew_context_layer_shapeoutput_word_hidden_statesoutput_entity_hidden_statesoutputss                                    r*   r~   LukeSelfAttention.forward  sr    '++A.	'#5 #(99.@-W]^#_ --dhh7K.LM	//

;O0PQ***/C/O #77

CU8VWO"77GY8Z[O"77G[8\]O"77G[8\]O &aJYJ&9:M%aJYJ&9:M%aIJ&9:M%aIJ&9:M $)<<AXAXY[]_A`#a #(<<AXAXY[]_A`#a #(<<AXAXY[]_A`#a #(<<AXAXY[]_A`#a  %*II/CEY.Z`a$b!&+ii1EG[0\bc&d#$yy*?AX)Y_`a 33DJJ?S4TUK$||K9L9LRQS9TU+dii8P8P.QQ%/.@ --//0@b/I ,,7  -	9O_kB%--aAq9DDF"/"4"4"6s";t?Q?Q>S"S%**,CD$1!ZiZ2B$C!'*.'*79:q8H*I'02M_G  12MNGr)   )r   r   rg   r   r   r   r   r   r   r   r   NNF)	r   r    r!   r"   rY   r   r~   r(   r   r   s   @r*   r   r     s%    G0% P Pr)   r   c                   z   ^  \ rS rSrU 4S jrS\R                  S\R                  S\R                  4S jrSrU =r	$ )LukeSelfOutputi	  c                 (  > [         TU ]  5         [        R                  " UR                  UR                  5      U l        [        R                  " UR                  UR                  S9U l        [        R                  " UR                  5      U l
        g NrV   )rX   rY   r   r   r\   denserc   rd   re   rf   rg   rh   s     r*   rY   LukeSelfOutput.__init__
  s`    YYv1163E3EF
f&8&8f>S>STzz&"<"<=r)   r6   input_tensorreturnc                 p    U R                  U5      nU R                  U5      nU R                  X-   5      nU$ r   r   rg   rc   ri   r6   r   s      r*   r~   LukeSelfOutput.forward  5    

=1]3}'CDr)   rc   r   rg   
r   r    r!   r"   rY   r$   Tensorr~   r(   r   r   s   @r*   r   r   	  6    >U\\  RWR^R^  r)   r   c                   >   ^  \ rS rSrU 4S jrS r   SS jrSrU =r$ )LukeAttentioni  c                    > [         TU ]  5         [        U5      U l        [	        U5      U l        [        5       U l        g r   )rX   rY   r   ri   r   outputsetpruned_headsrh   s     r*   rY   LukeAttention.__init__  s0    %f-	$V,Er)   c                     [        S5      eNz4LUKE does not support the pruning of attention headsNotImplementedError)ri   headss     r*   prune_headsLukeAttention.prune_heads      !"XYYr)   c                 <   UR                  S5      nU R                  UUUUU5      nUc  US   nUn	O.[        R                  " US S SS9n[        R                  " X/SS9n	U R	                  X5      n
U
S S 2S U2S S 24   nUc  S nOU
S S 2US 2S S 24   nX4USS  -   nU$ )Nr   r   r   r   )ru   ri   r$   r   r   )ri   r   r   r   r   r   r   self_outputsconcat_self_outputsr   attention_outputword_attention_outputentity_attention_outputr   s                 r*   r~   LukeAttention.forward!  s     '++A.	yy 
  '".q/#5 "'))L!,<!"D#(99.@-W]^#_ ;;':Q 0JYJ1A B'&*#&6q)*a7G&H# )B\RSRTEUUr)   )r   r   ri   r   )	r   r    r!   r"   rY   r  r~   r(   r   r   s   @r*   r   r     s#    "Z " "r)   r   c                   b   ^  \ rS rSrU 4S jrS\R                  S\R                  4S jrSrU =r	$ )LukeIntermediateiG  c                   > [         TU ]  5         [        R                  " UR                  UR
                  5      U l        [        UR                  [        5      (       a  [        UR                     U l        g UR                  U l        g r   )rX   rY   r   r   r\   intermediate_sizer   
isinstance
hidden_actstrr   intermediate_act_fnrh   s     r*   rY   LukeIntermediate.__init__H  s`    YYv1163K3KL
f''--'-f.?.?'@D$'-'8'8D$r)   r6   r   c                 J    U R                  U5      nU R                  U5      nU$ r   r   r  ri   r6   s     r*   r~   LukeIntermediate.forwardP  s&    

=100?r)   r  r   r   s   @r*   r  r  G  s(    9U\\ ell  r)   r  c                   z   ^  \ rS rSrU 4S jrS\R                  S\R                  S\R                  4S jrSrU =r	$ )
LukeOutputiW  c                 (  > [         TU ]  5         [        R                  " UR                  UR
                  5      U l        [        R                  " UR
                  UR                  S9U l        [        R                  " UR                  5      U l        g r   )rX   rY   r   r   r  r\   r   rc   rd   re   rf   rg   rh   s     r*   rY   LukeOutput.__init__X  s`    YYv779K9KL
f&8&8f>S>STzz&"<"<=r)   r6   r   r   c                 p    U R                  U5      nU R                  U5      nU R                  X-   5      nU$ r   r   r   s      r*   r~   LukeOutput.forward^  r   r)   r   r   r   s   @r*   r  r  W  r   r)   r  c                   >   ^  \ rS rSrU 4S jr   SS jrS rSrU =r$ )	LukeLayerie  c                    > [         TU ]  5         UR                  U l        SU l        [	        U5      U l        [        U5      U l        [        U5      U l	        g Nr   )
rX   rY   chunk_size_feed_forwardseq_len_dimr   	attentionr  intermediater  r   rh   s     r*   rY   LukeLayer.__init__f  sI    '-'E'E$&v.,V4 (r)   c                 B   UR                  S5      nU R                  UUUUUS9nUc  US   nO[        R                  " US S SS9nUSS  n	[	        U R
                  U R                  U R                  U5      n
U
S S 2S U2S S 24   nUc  S nOU
S S 2US 2S S 24   nX4U	-   n	U	$ )Nr   )r   r   r   r   )ru   r&  r$   r   r   feed_forward_chunkr$  r%  )ri   r   r   r   r   r   r   self_attention_outputsconcat_attention_outputr   layer_outputword_layer_outputentity_layer_outputs                r*   r~   LukeLayer.forwardn  s     '++A.	!% / "0 "
  '&<Q&?#&+ii0Fr0JPQ&R#(,0##T%A%A4CSCSUl
 )JYJ)9:'"&".q)*a/?"@$:WDr)   c                 J    U R                  U5      nU R                  X!5      nU$ r   )r'  r   )ri   r	  intermediate_outputr-  s       r*   r*  LukeLayer.feed_forward_chunk  s)    "//0@A{{#6Ir)   )r&  r$  r'  r   r%  r   )	r   r    r!   r"   rY   r~   r*  r(   r   r   s   @r*   r!  r!  e  s#    ) #J r)   r!  c                   <   ^  \ rS rSrU 4S jr     SS jrSrU =r$ )LukeEncoderi  c                    > [         TU ]  5         Xl        [        R                  " [        UR                  5       Vs/ sH  n[        U5      PM     sn5      U l        SU l	        g s  snf )NF)
rX   rY   rj   r   
ModuleListrangenum_hidden_layersr!  layergradient_checkpointing)ri   rj   _rk   s      r*   rY   LukeEncoder.__init__  sR    ]]uVE]E]?^#_?^!If$5?^#_`
&+# $`s   A%c                    U(       a  SOS nU(       a  SOS n	U(       a  SOS n
[        U R                  5       HI  u  pU(       a
  X4-   nX4-   n	Ub  XK   OS nU" UUUUU5      nUS   nUb  US   nU(       d  MA  XS   4-   n
MK     U(       a
  X4-   nX4-   n	U(       d  [        S UUU
UU	4 5       5      $ [        UUU
UU	S9$ )Nr   r   r   r   c              3   .   #    U H  nUc  M  Uv   M     g 7fr   r   .0vs     r*   	<genexpr>&LukeEncoder.forward.<locals>.<genexpr>  "      
A     	)last_hidden_stater6   r7   r   r   )	enumerater:  r'   r,   )ri   r   r   r   r   r   output_hidden_statesreturn_dictall_word_hidden_statesall_entity_hidden_statesall_self_attentionsilayer_modulelayer_head_masklayer_outputss                  r*   r~   LukeEncoder.forward  s    (<)=24 $5b4(4OA#)?BW)W&+CF]+](.7.CilO("$!M "/q!1#/'4Q'7$  &91=M<O&O#)  5,  %;>S%S"'?BY'Y$ 
 '*'(,
 
 
 #00*%9!9
 	
r)   )rj   r;  r:  )NNFFTr   r    r!   r"   rY   r~   r(   r   r   s   @r*   r5  r5    s#    , ":
 :
r)   r5  c                   b   ^  \ rS rSrU 4S jrS\R                  S\R                  4S jrSrU =r	$ )
LukePooleri  c                    > [         TU ]  5         [        R                  " UR                  UR                  5      U l        [        R                  " 5       U l        g r   )rX   rY   r   r   r\   r   Tanh
activationrh   s     r*   rY   LukePooler.__init__  s9    YYv1163E3EF
'')r)   r6   r   c                 \    US S 2S4   nU R                  U5      nU R                  U5      nU$ )Nr   )r   rX  )ri   r6   first_token_tensorpooled_outputs       r*   r~   LukePooler.forward  s6     +1a40

#566r)   )rX  r   r   r   s   @r*   rU  rU    s(    $
U\\ ell  r)   rU  c                   .   ^  \ rS rSrU 4S jrS rSrU =r$ )EntityPredictionHeadTransformi  c                 p  > [         TU ]  5         [        R                  " UR                  UR
                  5      U l        [        UR                  [        5      (       a  [        UR                     U l        OUR                  U l        [        R                  " UR
                  UR                  S9U l        g r   )rX   rY   r   r   r\   r   r   r  r  r  r   transform_act_fnrc   rd   rh   s     r*   rY   &EntityPredictionHeadTransform.__init__  s~    YYv1163I3IJ
f''--$*6+<+<$=D!$*$5$5D!f&<&<&BWBWXr)   c                 l    U R                  U5      nU R                  U5      nU R                  U5      nU$ r   )r   ra  rc   r  s     r*   r~   %EntityPredictionHeadTransform.forward  s4    

=1--m<}5r)   )rc   r   ra  rS  r   s   @r*   r_  r_    s    Y r)   r_  c                   .   ^  \ rS rSrU 4S jrS rSrU =r$ )EntityPredictionHeadi  c                   > [         TU ]  5         Xl        [        U5      U l        [
        R                  " UR                  UR                  SS9U l	        [
        R                  " [        R                  " UR                  5      5      U l        g )NFr   )rX   rY   rj   r_  	transformr   r   r   r   decoder	Parameterr$   rv   r   rh   s     r*   rY   EntityPredictionHead.__init__  s_    6v>yy!7!79Q9QX]^LLV-E-E!FG	r)   c                 d    U R                  U5      nU R                  U5      U R                  -   nU$ r   )rh  ri  r   r  s     r*   r~   EntityPredictionHead.forward  s-    }5]3dii?r)   )r   rj   ri  rh  rS  r   s   @r*   rf  rf    s    H r)   rf  c                   R    \ rS rSr% \\S'   SrSrSS/rS\	R                  4S jrS	rg
)LukePreTrainedModeli  rj   lukeTr   r   modulec                    [        U[        R                  5      (       ak  UR                  R                  R                  SU R                  R                  S9  UR                  b%  UR                  R                  R                  5         gg[        U[        R                  5      (       a  UR                  S:X  a%  UR                  R                  R                  5         O8UR                  R                  R                  SU R                  R                  S9  UR                  b2  UR                  R                  UR                     R                  5         gg[        U[        R                  5      (       aJ  UR                  R                  R                  5         UR                  R                  R                  S5        gg)zInitialize the weightsg        )meanstdNr         ?)r  r   r   weightdatanormal_rj   initializer_ranger   zero_rZ   embedding_dimrU   rc   fill_)ri   rq  s     r*   _init_weights!LukePreTrainedModel._init_weights  s1   fbii((MM&&CT[[5R5R&S{{&  &&( '--##q(""((*""**9V9V*W!!-""6#5#56<<> .--KK""$MM$$S) .r)   r   N)r   r    r!   r"   r   r&   base_model_prefixsupports_gradient_checkpointing_no_split_modulesr   Moduler}  r(   r   r)   r*   ro  ro    s0    &*#(*@A*BII *r)   ro  zt

@auto_docstring(
    custom_intro="""
    The bare LUKE model transformer outputting raw hidden-states for both word tokens and entities without any
    specific head on top.
    """
)
class LukeModel(LukePreTrainedModel):
    def __init__(self, config: LukeConfig, add_pooling_layer: bool = True):
        r"""
        add_pooling_layer (bool, *optional*, defaults to `True`):
            Whether to add a pooling layer
        """
        super().__init__(config)
        self.config = config

        self.embeddings = LukeEmbeddings(config)
        self.entity_embeddings = LukeEntityEmbeddings(config)
        self.encoder = LukeEncoder(config)

        self.pooler = LukePooler(config) if add_pooling_layer else None

        # Initialize weights and apply final processing
        self.post_init()

    def get_input_embeddings(self):
        return self.embeddings.word_embeddings

    def set_input_embeddings(self, value):
        self.embeddings.word_embeddings = value

    def get_entity_embeddings(self):
        return self.entity_embeddings.entity_embeddings

    def set_entity_embeddings(self, value):
        self.entity_embeddings.entity_embeddings = value

    def _prune_heads(self, heads_to_prune):
        raise NotImplementedError("LUKE does not support the pruning of attention heads")

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.FloatTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, BaseLukeModelOutputWithPooling]:
        r"""
        entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
            Indices of entity tokens in the entity vocabulary.

            Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
            [`PreTrainedTokenizer.__call__`] for details.
        entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
            Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

            - 1 for entity tokens that are **not masked**,
            - 0 for entity tokens that are **masked**.
        entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
            Segment token indices to indicate first and second portions of the entity token inputs. Indices are
            selected in `[0, 1]`:

            - 0 corresponds to a *portion A* entity token,
            - 1 corresponds to a *portion B* entity token.
        entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
            Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
            config.max_position_embeddings - 1]`.

        Examples:

        ```python
        >>> from transformers import AutoTokenizer, LukeModel

        >>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-base")
        >>> model = LukeModel.from_pretrained("studio-ousia/luke-base")
        # Compute the contextualized entity representation corresponding to the entity mention "Beyoncé"

        >>> text = "Beyoncé lives in Los Angeles."
        >>> entity_spans = [(0, 7)]  # character-based entity span corresponding to "Beyoncé"

        >>> encoding = tokenizer(text, entity_spans=entity_spans, add_prefix_space=True, return_tensors="pt")
        >>> outputs = model(**encoding)
        >>> word_last_hidden_state = outputs.last_hidden_state
        >>> entity_last_hidden_state = outputs.entity_last_hidden_state
        # Input Wikipedia entities to obtain enriched contextualized representations of word tokens

        >>> text = "Beyoncé lives in Los Angeles."
        >>> entities = [
        ...     "Beyoncé",
        ...     "Los Angeles",
        ... ]  # Wikipedia entity titles corresponding to the entity mentions "Beyoncé" and "Los Angeles"
        >>> entity_spans = [
        ...     (0, 7),
        ...     (17, 28),
        ... ]  # character-based entity spans corresponding to "Beyoncé" and "Los Angeles"

        >>> encoding = tokenizer(
        ...     text, entities=entities, entity_spans=entity_spans, add_prefix_space=True, return_tensors="pt"
        ... )
        >>> outputs = model(**encoding)
        >>> word_last_hidden_state = outputs.last_hidden_state
        >>> entity_last_hidden_state = outputs.entity_last_hidden_state
        ```"""
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict

        if input_ids is not None and inputs_embeds is not None:
            raise ValueError("You cannot specify both input_ids and inputs_embeds at the same time")
        elif input_ids is not None:
            self.warn_if_padding_and_no_attention_mask(input_ids, attention_mask)
            input_shape = input_ids.size()
        elif inputs_embeds is not None:
            input_shape = inputs_embeds.size()[:-1]
        else:
            raise ValueError("You have to specify either input_ids or inputs_embeds")

        batch_size, seq_length = input_shape
        device = input_ids.device if input_ids is not None else inputs_embeds.device

        if attention_mask is None:
            attention_mask = torch.ones((batch_size, seq_length), device=device)
        if token_type_ids is None:
            token_type_ids = torch.zeros(input_shape, dtype=torch.long, device=device)
        if entity_ids is not None:
            entity_seq_length = entity_ids.size(1)
            if entity_attention_mask is None:
                entity_attention_mask = torch.ones((batch_size, entity_seq_length), device=device)
            if entity_token_type_ids is None:
                entity_token_type_ids = torch.zeros((batch_size, entity_seq_length), dtype=torch.long, device=device)

        # Prepare head mask if needed
        head_mask = self.get_head_mask(head_mask, self.config.num_hidden_layers)

        # First, compute word embeddings
        word_embedding_output = self.embeddings(
            input_ids=input_ids,
            position_ids=position_ids,
            token_type_ids=token_type_ids,
            inputs_embeds=inputs_embeds,
        )

        # Second, compute extended attention mask
        extended_attention_mask = self.get_extended_attention_mask(attention_mask, entity_attention_mask)

        # Third, compute entity embeddings and concatenate with word embeddings
        if entity_ids is None:
            entity_embedding_output = None
        else:
            entity_embedding_output = self.entity_embeddings(entity_ids, entity_position_ids, entity_token_type_ids)

        # Fourth, send embeddings through the model
        encoder_outputs = self.encoder(
            word_embedding_output,
            entity_embedding_output,
            attention_mask=extended_attention_mask,
            head_mask=head_mask,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=return_dict,
        )

        # Fifth, get the output. LukeModel outputs the same as BertModel, namely sequence_output of shape
        # (batch_size, seq_len, hidden_size)
        sequence_output = encoder_outputs[0]

        # Sixth, we compute the pooled_output, based on the sequence_output
        pooled_output = self.pooler(sequence_output) if self.pooler is not None else None

        if not return_dict:
            return (sequence_output, pooled_output) + encoder_outputs[1:]

        return BaseLukeModelOutputWithPooling(
            last_hidden_state=sequence_output,
            pooler_output=pooled_output,
            hidden_states=encoder_outputs.hidden_states,
            attentions=encoder_outputs.attentions,
            entity_last_hidden_state=encoder_outputs.entity_last_hidden_state,
            entity_hidden_states=encoder_outputs.entity_hidden_states,
        )

    def get_extended_attention_mask(
        self, word_attention_mask: torch.LongTensor, entity_attention_mask: Optional[torch.LongTensor]
    ):
        """
        Makes broadcastable attention and causal masks so that future and masked tokens are ignored.

        Arguments:
            word_attention_mask (`torch.LongTensor`):
                Attention mask for word tokens with ones indicating tokens to attend to, zeros for tokens to ignore.
            entity_attention_mask (`torch.LongTensor`, *optional*):
                Attention mask for entity tokens with ones indicating tokens to attend to, zeros for tokens to ignore.

        Returns:
            `torch.Tensor` The extended attention mask, with the same dtype as `attention_mask.dtype`.
        """
        attention_mask = word_attention_mask
        if entity_attention_mask is not None:
            attention_mask = torch.cat([attention_mask, entity_attention_mask], dim=-1)

        if attention_mask.dim() == 3:
            extended_attention_mask = attention_mask[:, None, :, :]
        elif attention_mask.dim() == 2:
            extended_attention_mask = attention_mask[:, None, None, :]
        else:
            raise ValueError(f"Wrong shape for attention_mask (shape {attention_mask.shape})")

        extended_attention_mask = extended_attention_mask.to(dtype=self.dtype)  # fp16 compatibility
        extended_attention_mask = (1.0 - extended_attention_mask) * torch.finfo(self.dtype).min
        return extended_attention_mask


def create_position_ids_from_input_ids(input_ids, padding_idx):
    """
    Replace non-padding symbols with their position numbers. Position numbers begin at padding_idx+1. Padding symbols
    are ignored. This is modified from fairseq's `utils.make_positions`.

    Args:
        input_ids: torch.Tensor

    Returns: torch.Tensor
    """
    mask = input_ids.ne(padding_idx).int()
    incremental_indices = torch.cumsum(mask, dim=1).type_as(mask) * mask
    return incremental_indices.long() + padding_idx


class LukeLMHead(nn.Module):
    """Roberta Head for masked language modeling."""

    def __init__(self, config):
        super().__init__()
        self.dense = nn.Linear(config.hidden_size, config.hidden_size)
        self.layer_norm = nn.LayerNorm(config.hidden_size, eps=config.layer_norm_eps)

        self.decoder = nn.Linear(config.hidden_size, config.vocab_size)
        self.bias = nn.Parameter(torch.zeros(config.vocab_size))
        self.decoder.bias = self.bias

    def forward(self, features, **kwargs):
        x = self.dense(features)
        x = gelu(x)
        x = self.layer_norm(x)

        # project back to size of vocabulary with bias
        x = self.decoder(x)

        return x

    def _tie_weights(self):
        # To tie those two weights if they get disconnected (on TPU or when the bias is resized)
        if self.decoder.bias.device.type == "meta":
            self.decoder.bias = self.bias
        else:
            self.bias = self.decoder.bias

@auto_docstring(
    custom_intro="""
    The LUKE model with a language modeling head and entity prediction head on top for masked language modeling and
    masked entity prediction.
    """
)
class LukeForMaskedLM(LukePreTrainedModel):
    _tied_weights_keys = ["lm_head.decoder.weight", "lm_head.decoder.bias", "entity_predictions.decoder.weight"]

    def __init__(self, config):
        super().__init__(config)

        self.luke = LukeModel(config)

        self.lm_head = LukeLMHead(config)
        self.entity_predictions = EntityPredictionHead(config)

        self.loss_fn = nn.CrossEntropyLoss()

        # Initialize weights and apply final processing
        self.post_init()

    def tie_weights(self):
        super().tie_weights()
        self._tie_or_clone_weights(self.entity_predictions.decoder, self.luke.entity_embeddings.entity_embeddings)

    def get_output_embeddings(self):
        return self.lm_head.decoder

    def set_output_embeddings(self, new_embeddings):
        self.lm_head.decoder = new_embeddings

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.LongTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        labels: Optional[torch.LongTensor] = None,
        entity_labels: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, LukeMaskedLMOutput]:
        r"""
        entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
            Indices of entity tokens in the entity vocabulary.

            Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
            [`PreTrainedTokenizer.__call__`] for details.
        entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
            Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

            - 1 for entity tokens that are **not masked**,
            - 0 for entity tokens that are **masked**.
        entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
            Segment token indices to indicate first and second portions of the entity token inputs. Indices are
            selected in `[0, 1]`:

            - 0 corresponds to a *portion A* entity token,
            - 1 corresponds to a *portion B* entity token.
        entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
            Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
            config.max_position_embeddings - 1]`.
        labels (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):
            Labels for computing the masked language modeling loss. Indices should be in `[-100, 0, ...,
            config.vocab_size]` (see `input_ids` docstring). Tokens with indices set to `-100` are ignored (masked);
            the loss is only computed for the tokens with labels in `[0, ..., config.vocab_size]`
        entity_labels (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
            Labels for computing the masked entity prediction loss. Indices should be in `[-100, 0, ...,
            config.entity_vocab_size]` (see `entity_ids` docstring). Entities with indices set to `-100` are ignored
            (masked); the loss is only computed for the entities with labels in `[0, ..., config.entity_vocab_size]`
NTry   r   rz   rx   r   r  r  r  r   r{   r   rI  rJ  rn   c              3   .   #    U H  nUc  M  Uv   M     g 7fr   r   r@  s     r*   rC  *LukeForMaskedLM.forward.<locals>.<genexpr>  s"      	A  	rF  )r1   r2   r3   r4   r5   r6   r   r7   )rj   r  rp  r  rG  rs   rq   r  r   r[   r   r  r   r'   r6   r   r7   r/   )ri   ry   r   rz   rx   r   r  r  r  r  r  r   r{   r   rI  rJ  r   r1   r2   r4   r3   r5   s                         r*   r~   LukeForMaskedLM.forwardW  s   b &1%<k$++B]B]))))%!"7"7 3'/!5  
  g778YYv}}-F||FKKDKK4J4J$KV[[Y[_]H|++7 33G4T4TUM(<<(:(:2t{{?\?\(]_l_q_qrt_uv<#D(?D  !))00&&	   "'!//!(!=!=))	
 		
r)   )r  r  r  rp  NNNNNNNNNNNNNNN)r   r    r!   r"   _tied_weights_keysrY   r  r  r  r   r   r$   r   r%   r  r   r'   r/   r~   r(   r   r   s   @r*   r  r  7  s    qs$.  156:593715<@<@:>-1481559,0/3&*!q
E,,-q
 !!2!23q
 !!1!12	q

 u//0q
 U--.q
  ((8(89q
  ((8(89q
 &e&6&67q
 ))*q
   0 01q
 E--.q
   1 12q
 $D>q
 'tnq
  d^!q
" 
u((	)#q
 q
r)   r  z
    The LUKE model with a classification head on top (a linear layer on top of the hidden state of the first entity
    token) for entity classification tasks, such as Open Entity.
    c            "         ^  \ rS rSrU 4S jr\              SS\\R                     S\\R                     S\\R                     S\\R                     S\\R                     S\\R                     S	\\R                     S
\\R                     S\\R                     S\\R                     S\\R                     S\\
   S\\
   S\\
   S\\\4   4S jj5       rSrU =r$ )LukeForEntityClassificationi  c                 0  > [         TU ]  U5        [        U5      U l        UR                  U l        [
        R                  " UR                  5      U l        [
        R                  " UR                  UR                  5      U l        U R                  5         g r   rX   rY   r  rp  
num_labelsr   re   rf   rg   r   r\   
classifierr  rh   s     r*   rY   $LukeForEntityClassification.__init__  si     f%	 ++zz&"<"<=))F$6$68I8IJ 	r)   ry   r   rz   rx   r   r  r  r  r   r{   r  r   rI  rJ  r   c                    Ub  UOU R                   R                  nU R                  UUUUUUUUU	U
UUSS9nUR                  SS2SSS24   nU R	                  U5      nU R                  U5      nSnUb  UR                  UR                  5      nUR                  S:X  a!  [        R                  R                  UU5      nOM[        R                  R                  UR                  S5      UR                  S5      R                  U5      5      nU(       d5  [        S UUUR                   UR"                  UR$                  4 5       5      $ ['        UUUR                   UR"                  UR$                  S9$ )	u	  
entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
    Indices of entity tokens in the entity vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.
entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
    Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

    - 1 for entity tokens that are **not masked**,
    - 0 for entity tokens that are **masked**.
entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
    Segment token indices to indicate first and second portions of the entity token inputs. Indices are
    selected in `[0, 1]`:

    - 0 corresponds to a *portion A* entity token,
    - 1 corresponds to a *portion B* entity token.
entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
    Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.
labels (`torch.LongTensor` of shape `(batch_size,)` or `(batch_size, num_labels)`, *optional*):
    Labels for computing the classification loss. If the shape is `(batch_size,)`, cross entropy is used for
    single-label classification; in this case, labels should contain indices in `[0, ..., config.num_labels - 1]`.
    If the shape is `(batch_size, num_labels)`, binary cross entropy is used for multi-label classification; in
    this case, labels should only contain `[0, 1]`, where 0 and 1 indicate false and true, respectively.

Examples:

```python
>>> from transformers import AutoTokenizer, LukeForEntityClassification

>>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-large-finetuned-open-entity")
>>> model = LukeForEntityClassification.from_pretrained("studio-ousia/luke-large-finetuned-open-entity")

>>> text = "Beyoncé lives in Los Angeles."
>>> entity_spans = [(0, 7)]  # character-based entity span corresponding to "Beyoncé"
>>> inputs = tokenizer(text, entity_spans=entity_spans, return_tensors="pt")
>>> outputs = model(**inputs)
>>> logits = outputs.logits
>>> predicted_class_idx = logits.argmax(-1).item()
>>> print("Predicted class:", model.config.id2label[predicted_class_idx])
Predicted class: person
```
        """
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict

        outputs = self.luke(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            entity_ids=entity_ids,
            entity_attention_mask=entity_attention_mask,
            entity_token_type_ids=entity_token_type_ids,
            entity_position_ids=entity_position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=True,
        )

        feature_vector = outputs.entity_last_hidden_state[:, 0, :]
        feature_vector = self.dropout(feature_vector)
        logits = self.classifier(feature_vector)

        loss = None
        if labels is not None:
            labels = labels.to(logits.device)
            # 1-dimensional labels: cross entropy (single-label); otherwise binary cross entropy (multi-label)
            if labels.ndim == 1:
                loss = nn.functional.cross_entropy(logits, labels)
            else:
                loss = nn.functional.binary_cross_entropy_with_logits(logits, labels.to(logits.dtype))

        if not return_dict:
            return tuple(
                v
                for v in [loss, logits, outputs.hidden_states, outputs.entity_hidden_states, outputs.attentions]
                if v is not None
            )

        return EntityClassificationOutput(
            loss=loss,
            logits=logits,
            hidden_states=outputs.hidden_states,
            entity_hidden_states=outputs.entity_hidden_states,
            attentions=outputs.attentions,
        )


@auto_docstring(
    custom_intro="""
    The LUKE model with a classification head on top (a linear layer on top of the hidden states of the two entity
    tokens) for entity pair classification tasks, such as TACRED.
    """
)
class LukeForEntityPairClassification(LukePreTrainedModel):
    def __init__(self, config):
        super().__init__(config)

        self.luke = LukeModel(config)

        self.num_labels = config.num_labels
        self.dropout = nn.Dropout(config.hidden_dropout_prob)
        self.classifier = nn.Linear(config.hidden_size * 2, config.num_labels, False)

        # Initialize weights and apply final processing
        self.post_init()

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.FloatTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        labels: Optional[torch.LongTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, EntityPairClassificationOutput]:
        r"""
entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
    Indices of entity tokens in the entity vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.
entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
    Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

    - 1 for entity tokens that are **not masked**,
    - 0 for entity tokens that are **masked**.
entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
    Segment token indices to indicate first and second portions of the entity token inputs. Indices are
    selected in `[0, 1]`:

    - 0 corresponds to a *portion A* entity token,
    - 1 corresponds to a *portion B* entity token.
entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
    Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.
labels (`torch.LongTensor` of shape `(batch_size,)` or `(batch_size, num_labels)`, *optional*):
    Labels for computing the classification loss. If the shape is `(batch_size,)`, cross entropy is used for
    single-label classification; in this case, labels should contain indices in `[0, ..., config.num_labels - 1]`.
    If the shape is `(batch_size, num_labels)`, binary cross entropy is used for multi-label classification; in
    this case, labels should only contain `[0, 1]`, where 0 and 1 indicate false and true, respectively.

Examples:

```python
>>> from transformers import AutoTokenizer, LukeForEntityPairClassification

>>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-large-finetuned-tacred")
>>> model = LukeForEntityPairClassification.from_pretrained("studio-ousia/luke-large-finetuned-tacred")

>>> text = "Beyoncé lives in Los Angeles."
>>> entity_spans = [
...     (0, 7),
...     (17, 28),
... ]  # character-based entity spans corresponding to "Beyoncé" and "Los Angeles"
>>> inputs = tokenizer(text, entity_spans=entity_spans, return_tensors="pt")
>>> outputs = model(**inputs)
>>> logits = outputs.logits
>>> predicted_class_idx = logits.argmax(-1).item()
>>> print("Predicted class:", model.config.id2label[predicted_class_idx])
Predicted class: per:cities_of_residence
```
        """
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict

        outputs = self.luke(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            entity_ids=entity_ids,
            entity_attention_mask=entity_attention_mask,
            entity_token_type_ids=entity_token_type_ids,
            entity_position_ids=entity_position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=True,
        )

        feature_vector = torch.cat(
            [outputs.entity_last_hidden_state[:, 0, :], outputs.entity_last_hidden_state[:, 1, :]], dim=1
        )
        feature_vector = self.dropout(feature_vector)
        logits = self.classifier(feature_vector)

        loss = None
        if labels is not None:
            labels = labels.to(logits.device)
            # 1-dimensional labels: cross entropy (single-label); otherwise binary cross entropy (multi-label)
            if labels.ndim == 1:
                loss = nn.functional.cross_entropy(logits, labels)
            else:
                loss = nn.functional.binary_cross_entropy_with_logits(logits, labels.to(logits.dtype))

        if not return_dict:
            return tuple(
                v
                for v in [loss, logits, outputs.hidden_states, outputs.entity_hidden_states, outputs.attentions]
                if v is not None
            )

        return EntityPairClassificationOutput(
            loss=loss,
            logits=logits,
            hidden_states=outputs.hidden_states,
            entity_hidden_states=outputs.entity_hidden_states,
            attentions=outputs.attentions,
        )


@auto_docstring(
    custom_intro="""
    The LUKE model with a span classification head on top (a linear layer on top of the hidden states output) for tasks
    such as named entity recognition.
    """
)
class LukeForEntitySpanClassification(LukePreTrainedModel):
    def __init__(self, config):
        super().__init__(config)

        self.luke = LukeModel(config)

        self.num_labels = config.num_labels
        self.dropout = nn.Dropout(config.hidden_dropout_prob)
        self.classifier = nn.Linear(config.hidden_size * 3, config.num_labels)

        # Initialize weights and apply final processing
        self.post_init()

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.FloatTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        entity_start_positions: Optional[torch.LongTensor] = None,
        entity_end_positions: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        labels: Optional[torch.LongTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, EntitySpanClassificationOutput]:
        r"""
entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
    Indices of entity tokens in the entity vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.
entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
    Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

    - 1 for entity tokens that are **not masked**,
    - 0 for entity tokens that are **masked**.
entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
    Segment token indices to indicate first and second portions of the entity token inputs. Indices are
    selected in `[0, 1]`:

    - 0 corresponds to a *portion A* entity token,
    - 1 corresponds to a *portion B* entity token.
entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
    Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.
entity_start_positions (`torch.LongTensor`):
    The start positions of entities in the word token sequence.
entity_end_positions (`torch.LongTensor`):
    The end positions of entities in the word token sequence.
labels (`torch.LongTensor` of shape `(batch_size, entity_length)` or `(batch_size, entity_length, num_labels)`, *optional*):
    Labels for computing the classification loss. If the shape is `(batch_size, entity_length)`, cross entropy
    is used for single-label classification; in this case, labels should contain indices in `[0, ...,
    config.num_labels - 1]`. If the shape is `(batch_size, entity_length, num_labels)`, binary cross entropy is
    used for multi-label classification; in this case, labels should only contain `[0, 1]`, where 0 and 1
    indicate false and true, respectively.

Examples:

```python
>>> from transformers import AutoTokenizer, LukeForEntitySpanClassification

>>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-large-finetuned-conll-2003")
>>> model = LukeForEntitySpanClassification.from_pretrained("studio-ousia/luke-large-finetuned-conll-2003")

>>> text = "Beyoncé lives in Los Angeles"
>>> # List all possible entity spans in the text

>>> word_start_positions = [0, 8, 14, 17, 21]  # character-based start positions of word tokens
>>> word_end_positions = [7, 13, 16, 20, 28]  # character-based end positions of word tokens
>>> entity_spans = []
>>> for i, start_pos in enumerate(word_start_positions):
...     for end_pos in word_end_positions[i:]:
...         entity_spans.append((start_pos, end_pos))

>>> inputs = tokenizer(text, entity_spans=entity_spans, return_tensors="pt")
>>> outputs = model(**inputs)
>>> logits = outputs.logits
>>> predicted_class_indices = logits.argmax(-1).squeeze().tolist()
>>> for span, predicted_class_idx in zip(entity_spans, predicted_class_indices):
...     if predicted_class_idx != 0:
...         print(text[span[0] : span[1]], model.config.id2label[predicted_class_idx])
Beyoncé PER
Los Angeles LOC
```
        """
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict

        outputs = self.luke(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            entity_ids=entity_ids,
            entity_attention_mask=entity_attention_mask,
            entity_token_type_ids=entity_token_type_ids,
            entity_position_ids=entity_position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=True,
        )

        hidden_states = outputs.last_hidden_state
        hidden_size = hidden_states.size(-1)

        # gather the hidden states at the start and end word positions of every candidate span
        entity_start_positions = entity_start_positions.unsqueeze(-1).expand(-1, -1, hidden_size)
        if entity_start_positions.device != hidden_states.device:
            entity_start_positions = entity_start_positions.to(hidden_states.device)
        start_states = torch.gather(hidden_states, -2, entity_start_positions)

        entity_end_positions = entity_end_positions.unsqueeze(-1).expand(-1, -1, hidden_size)
        if entity_end_positions.device != hidden_states.device:
            entity_end_positions = entity_end_positions.to(hidden_states.device)
        end_states = torch.gather(hidden_states, -2, entity_end_positions)

        feature_vector = torch.cat([start_states, end_states, outputs.entity_last_hidden_state], dim=2)

        feature_vector = self.dropout(feature_vector)
        logits = self.classifier(feature_vector)

        loss = None
        if labels is not None:
            labels = labels.to(logits.device)
            # 2-dimensional labels: cross entropy (single-label); otherwise binary cross entropy (multi-label)
            if labels.ndim == 2:
                loss = nn.functional.cross_entropy(logits.view(-1, self.num_labels), labels.view(-1))
            else:
                loss = nn.functional.binary_cross_entropy_with_logits(logits, labels.to(logits.dtype))

        if not return_dict:
            return tuple(
                v
                for v in [loss, logits, outputs.hidden_states, outputs.entity_hidden_states, outputs.attentions]
                if v is not None
            )

        return EntitySpanClassificationOutput(
            loss=loss,
            logits=logits,
            hidden_states=outputs.hidden_states,
            entity_hidden_states=outputs.entity_hidden_states,
            attentions=outputs.attentions,
        )


@auto_docstring(
    custom_intro="""
    The LUKE Model transformer with a sequence classification/regression head on top (a linear layer on top of the
    pooled output) e.g. for GLUE tasks.
    """
)
class LukeForSequenceClassification(LukePreTrainedModel):
    def __init__(self, config):
        super().__init__(config)
        self.num_labels = config.num_labels
        self.luke = LukeModel(config)
        self.dropout = nn.Dropout(
            config.classifier_dropout if config.classifier_dropout is not None else config.hidden_dropout_prob
        )
        self.classifier = nn.Linear(config.hidden_size, config.num_labels)

        # Initialize weights and apply final processing
        self.post_init()

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.FloatTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        labels: Optional[torch.LongTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, LukeSequenceClassifierOutput]:
        r"""
entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
    Indices of entity tokens in the entity vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.
entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
    Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

    - 1 for entity tokens that are **not masked**,
    - 0 for entity tokens that are **masked**.
entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
    Segment token indices to indicate first and second portions of the entity token inputs. Indices are
    selected in `[0, 1]`:

    - 0 corresponds to a *portion A* entity token,
    - 1 corresponds to a *portion B* entity token.
entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
    Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.
labels (`torch.LongTensor` of shape `(batch_size,)`, *optional*):
    Labels for computing the sequence classification/regression loss. Indices should be in `[0, ...,
    config.num_labels - 1]`. If `config.num_labels == 1` a regression loss is computed (Mean-Square loss); if
    `config.num_labels > 1` a classification loss is computed (Cross-Entropy).
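
Example (an illustrative sketch rather than upstream documentation; the generic `studio-ousia/luke-base`
checkpoint is assumed, so the classification head is freshly initialized and predictions are meaningless until
the model is fine-tuned):

```python
>>> import torch
>>> from transformers import AutoTokenizer, LukeForSequenceClassification

>>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-base")
>>> model = LukeForSequenceClassification.from_pretrained("studio-ousia/luke-base", num_labels=2)

>>> inputs = tokenizer("LUKE is a contextualized representation model for words and entities.", return_tensors="pt")
>>> outputs = model(**inputs, labels=torch.tensor([1]))
>>> loss, logits = outputs.loss, outputs.logits  # logits shape: (batch_size, num_labels)
```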
        """
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict

        outputs = self.luke(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            entity_ids=entity_ids,
            entity_attention_mask=entity_attention_mask,
            entity_token_type_ids=entity_token_type_ids,
            entity_position_ids=entity_position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=True,
        )

        pooled_output = outputs.pooler_output

        pooled_output = self.dropout(pooled_output)
        logits = self.classifier(pooled_output)

        loss = None
        if labels is not None:
            labels = labels.to(logits.device)
            if self.config.problem_type is None:
                if self.num_labels == 1:
                    self.config.problem_type = "regression"
                elif self.num_labels > 1 and (labels.dtype == torch.long or labels.dtype == torch.int):
                    self.config.problem_type = "single_label_classification"
                else:
                    self.config.problem_type = "multi_label_classification"

            if self.config.problem_type == "regression":
                loss_fct = MSELoss()
                if self.num_labels == 1:
                    loss = loss_fct(logits.squeeze(), labels.squeeze())
                else:
                    loss = loss_fct(logits, labels)
            elif self.config.problem_type == "single_label_classification":
                loss_fct = CrossEntropyLoss()
                loss = loss_fct(logits.view(-1, self.num_labels), labels.view(-1))
            elif self.config.problem_type == "multi_label_classification":
                loss_fct = BCEWithLogitsLoss()
                loss = loss_fct(logits, labels)

        if not return_dict:
            return tuple(
                v
                for v in [loss, logits, outputs.hidden_states, outputs.entity_hidden_states, outputs.attentions]
                if v is not None
            )

        return LukeSequenceClassifierOutput(
            loss=loss,
            logits=logits,
            hidden_states=outputs.hidden_states,
            entity_hidden_states=outputs.entity_hidden_states,
            attentions=outputs.attentions,
        )


@auto_docstring(
    custom_intro="""
    The LUKE Model with a token classification head on top (a linear layer on top of the hidden-states output). To
    solve Named-Entity Recognition (NER) task using LUKE, `LukeForEntitySpanClassification` is more suitable than this
    class.
    """
)
class LukeForTokenClassification(LukePreTrainedModel):
    def __init__(self, config):
        super().__init__(config)
        self.num_labels = config.num_labels
        self.luke = LukeModel(config, add_pooling_layer=False)
        self.dropout = nn.Dropout(
            config.classifier_dropout if config.classifier_dropout is not None else config.hidden_dropout_prob
        )
        self.classifier = nn.Linear(config.hidden_size, config.num_labels)

        # Initialize weights and apply final processing
        self.post_init()

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.FloatTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        labels: Optional[torch.LongTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, LukeTokenClassifierOutput]:
        r"""
entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
    Indices of entity tokens in the entity vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.
entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
    Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

    - 1 for entity tokens that are **not masked**,
    - 0 for entity tokens that are **masked**.
entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
    Segment token indices to indicate first and second portions of the entity token inputs. Indices are
    selected in `[0, 1]`:

    - 0 corresponds to a *portion A* entity token,
    - 1 corresponds to a *portion B* entity token.
entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
    Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.
labels (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):
    Labels for computing the token classification loss. Indices should be in `[0, ...,
    config.num_labels - 1]`.
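
Example (an illustrative sketch rather than upstream documentation; `studio-ousia/luke-base` is assumed as the
checkpoint, so the token classification head is freshly initialized and predictions are meaningless until the
model is fine-tuned):

```python
>>> import torch
>>> from transformers import AutoTokenizer, LukeForTokenClassification

>>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-base")
>>> model = LukeForTokenClassification.from_pretrained("studio-ousia/luke-base", num_labels=5)

>>> inputs = tokenizer("Beyoncé lives in Los Angeles.", return_tensors="pt")
>>> with torch.no_grad():
...     outputs = model(**inputs)

>>> predictions = outputs.logits.argmax(dim=-1)  # one label id per word-piece position
```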
        """
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict

        outputs = self.luke(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            entity_ids=entity_ids,
            entity_attention_mask=entity_attention_mask,
            entity_token_type_ids=entity_token_type_ids,
            entity_position_ids=entity_position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=True,
        )

        sequence_output = outputs.last_hidden_state
        sequence_output = self.dropout(sequence_output)
        logits = self.classifier(sequence_output)

        loss = None
        if labels is not None:
            labels = labels.to(logits.device)
            loss_fct = CrossEntropyLoss()
            loss = loss_fct(logits.view(-1, self.num_labels), labels.view(-1))

        if not return_dict:
            return tuple(
                v
                for v in [loss, logits, outputs.hidden_states, outputs.entity_hidden_states, outputs.attentions]
                if v is not None
            )

        return LukeTokenClassifierOutput(
            loss=loss,
            logits=logits,
            hidden_states=outputs.hidden_states,
            entity_hidden_states=outputs.entity_hidden_states,
            attentions=outputs.attentions,
        )


@auto_docstring
class LukeForQuestionAnswering(LukePreTrainedModel):
    def __init__(self, config):
        super().__init__(config)

        self.num_labels = config.num_labels
        self.luke = LukeModel(config, add_pooling_layer=False)
        self.qa_outputs = nn.Linear(config.hidden_size, config.num_labels)

        # Initialize weights and apply final processing
        self.post_init()

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.FloatTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        start_positions: Optional[torch.LongTensor] = None,
        end_positions: Optional[torch.LongTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, LukeQuestionAnsweringModelOutput]:
        r"""
entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
    Indices of entity tokens in the entity vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.
entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
    Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

    - 1 for entity tokens that are **not masked**,
    - 0 for entity tokens that are **masked**.
entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
    Segment token indices to indicate first and second portions of the entity token inputs. Indices are
    selected in `[0, 1]`:

    - 0 corresponds to a *portion A* entity token,
    - 1 corresponds to a *portion B* entity token.
entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
    Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.
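
Example (an illustrative sketch rather than upstream documentation; `studio-ousia/luke-base` is assumed as the
checkpoint, so the span-prediction head is freshly initialized and the extracted answer is meaningless until
the model is fine-tuned on a QA dataset):

```python
>>> from transformers import AutoTokenizer, LukeForQuestionAnswering

>>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-base")
>>> model = LukeForQuestionAnswering.from_pretrained("studio-ousia/luke-base")

>>> question, context = "Where does Beyoncé live?", "Beyoncé lives in Los Angeles."
>>> inputs = tokenizer(question, context, return_tensors="pt")
>>> outputs = model(**inputs)

>>> start = outputs.start_logits.argmax(-1).item()
>>> end = outputs.end_logits.argmax(-1).item()
>>> answer = tokenizer.decode(inputs["input_ids"][0][start : end + 1])
```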
        """
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict

        outputs = self.luke(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            entity_ids=entity_ids,
            entity_attention_mask=entity_attention_mask,
            entity_token_type_ids=entity_token_type_ids,
            entity_position_ids=entity_position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=True,
        )

        sequence_output = outputs.last_hidden_state

        logits = self.qa_outputs(sequence_output)
        start_logits, end_logits = logits.split(1, dim=-1)
        start_logits = start_logits.squeeze(-1)
        end_logits = end_logits.squeeze(-1)

        total_loss = None
        if start_positions is not None and end_positions is not None:
            # if on multi-GPU, remove the extra dimension added by gathering
            if len(start_positions.size()) > 1:
                start_positions = start_positions.squeeze(-1)
            if len(end_positions.size()) > 1:
                end_positions = end_positions.squeeze(-1)
            # positions outside the model inputs are clamped and ignored in the loss
            ignored_index = start_logits.size(1)
            start_positions.clamp_(0, ignored_index)
            end_positions.clamp_(0, ignored_index)

            loss_fct = CrossEntropyLoss(ignore_index=ignored_index)
            start_loss = loss_fct(start_logits, start_positions)
            end_loss = loss_fct(end_logits, end_positions)
            total_loss = (start_loss + end_loss) / 2

        if not return_dict:
            return tuple(
                v
                for v in [
                    total_loss,
                    start_logits,
                    end_logits,
                    outputs.hidden_states,
                    outputs.entity_hidden_states,
                    outputs.attentions,
                ]
                if v is not None
            )

        return LukeQuestionAnsweringModelOutput(
            loss=total_loss,
            start_logits=start_logits,
            end_logits=end_logits,
            hidden_states=outputs.hidden_states,
            entity_hidden_states=outputs.entity_hidden_states,
            attentions=outputs.attentions,
        )


@auto_docstring
class LukeForMultipleChoice(LukePreTrainedModel):
    def __init__(self, config):
        super().__init__(config)

        self.luke = LukeModel(config)
        self.dropout = nn.Dropout(
            config.classifier_dropout if config.classifier_dropout is not None else config.hidden_dropout_prob
        )
        self.classifier = nn.Linear(config.hidden_size, 1)

        # Initialize weights and apply final processing
        self.post_init()

    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.FloatTensor] = None,
        token_type_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        entity_ids: Optional[torch.LongTensor] = None,
        entity_attention_mask: Optional[torch.FloatTensor] = None,
        entity_token_type_ids: Optional[torch.LongTensor] = None,
        entity_position_ids: Optional[torch.LongTensor] = None,
        head_mask: Optional[torch.FloatTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
        labels: Optional[torch.LongTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
    ) -> Union[tuple, LukeMultipleChoiceModelOutput]:
        r"""
input_ids (`torch.LongTensor` of shape `(batch_size, num_choices, sequence_length)`):
    Indices of input sequence tokens in the vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.

    [What are input IDs?](../glossary#input-ids)
token_type_ids (`torch.LongTensor` of shape `(batch_size, num_choices, sequence_length)`, *optional*):
    Segment token indices to indicate first and second portions of the inputs. Indices are selected in `[0,
    1]`:

    - 0 corresponds to a *sentence A* token,
    - 1 corresponds to a *sentence B* token.

    [What are token type IDs?](../glossary#token-type-ids)
position_ids (`torch.LongTensor` of shape `(batch_size, num_choices, sequence_length)`, *optional*):
    Indices of positions of each input sequence tokens in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.

    [What are position IDs?](../glossary#position-ids)
entity_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`):
    Indices of entity tokens in the entity vocabulary.

    Indices can be obtained using [`AutoTokenizer`]. See [`PreTrainedTokenizer.encode`] and
    [`PreTrainedTokenizer.__call__`] for details.
entity_attention_mask (`torch.FloatTensor` of shape `(batch_size, entity_length)`, *optional*):
    Mask to avoid performing attention on padding entity token indices. Mask values selected in `[0, 1]`:

    - 1 for entity tokens that are **not masked**,
    - 0 for entity tokens that are **masked**.
entity_token_type_ids (`torch.LongTensor` of shape `(batch_size, entity_length)`, *optional*):
    Segment token indices to indicate first and second portions of the entity token inputs. Indices are
    selected in `[0, 1]`:

    - 0 corresponds to a *portion A* entity token,
    - 1 corresponds to a *portion B* entity token.
entity_position_ids (`torch.LongTensor` of shape `(batch_size, entity_length, max_mention_length)`, *optional*):
    Indices of positions of each input entity in the position embeddings. Selected in the range `[0,
    config.max_position_embeddings - 1]`.
inputs_embeds (`torch.FloatTensor` of shape `(batch_size, num_choices, sequence_length, hidden_size)`, *optional*):
    Optionally, instead of passing `input_ids` you can choose to directly pass an embedded representation. This
    is useful if you want more control over how to convert `input_ids` indices into associated vectors than the
    model's internal embedding lookup matrix.
labels (`torch.LongTensor` of shape `(batch_size,)`, *optional*):
    Labels for computing the multiple choice classification loss. Indices should be in `[0, ...,
    num_choices-1]` where `num_choices` is the size of the second dimension of the input tensors. (See
    `input_ids` above)
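
Example (an illustrative sketch rather than upstream documentation; `studio-ousia/luke-base` is assumed as the
checkpoint, so the choice-scoring head is freshly initialized and scores are meaningless until the model is
fine-tuned):

```python
>>> import torch
>>> from transformers import AutoTokenizer, LukeForMultipleChoice

>>> tokenizer = AutoTokenizer.from_pretrained("studio-ousia/luke-base")
>>> model = LukeForMultipleChoice.from_pretrained("studio-ousia/luke-base")

>>> prompt = "Beyoncé lives in"
>>> choices = ["Los Angeles.", "a submarine."]
>>> encoding = tokenizer([prompt, prompt], choices, return_tensors="pt", padding=True)
>>> inputs = {k: v.unsqueeze(0) for k, v in encoding.items()}  # add the (batch_size, num_choices, ...) dims
>>> outputs = model(**inputs, labels=torch.tensor([0]))
>>> loss, logits = outputs.loss, outputs.logits  # logits shape: (batch_size, num_choices)
```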
        """
        return_dict = return_dict if return_dict is not None else self.config.use_return_dict
        num_choices = input_ids.shape[1] if input_ids is not None else inputs_embeds.shape[1]

        # flatten the choice dimension into the batch dimension before running LUKE
        input_ids = input_ids.view(-1, input_ids.size(-1)) if input_ids is not None else None
        attention_mask = attention_mask.view(-1, attention_mask.size(-1)) if attention_mask is not None else None
        token_type_ids = token_type_ids.view(-1, token_type_ids.size(-1)) if token_type_ids is not None else None
        position_ids = position_ids.view(-1, position_ids.size(-1)) if position_ids is not None else None
        inputs_embeds = (
            inputs_embeds.view(-1, inputs_embeds.size(-2), inputs_embeds.size(-1))
            if inputs_embeds is not None
            else None
        )
        entity_ids = entity_ids.view(-1, entity_ids.size(-1)) if entity_ids is not None else None
        entity_attention_mask = (
            entity_attention_mask.view(-1, entity_attention_mask.size(-1))
            if entity_attention_mask is not None
            else None
        )
        entity_token_type_ids = (
            entity_token_type_ids.view(-1, entity_token_type_ids.size(-1))
            if entity_token_type_ids is not None
            else None
        )
        entity_position_ids = (
            entity_position_ids.view(-1, entity_position_ids.size(-2), entity_position_ids.size(-1))
            if entity_position_ids is not None
            else None
        )

        outputs = self.luke(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            entity_ids=entity_ids,
            entity_attention_mask=entity_attention_mask,
            entity_token_type_ids=entity_token_type_ids,
            entity_position_ids=entity_position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
            return_dict=True,
        )

        pooled_output = outputs.pooler_output

        pooled_output = self.dropout(pooled_output)
        logits = self.classifier(pooled_output)
        reshaped_logits = logits.view(-1, num_choices)

        loss = None
        if labels is not None:
            labels = labels.to(reshaped_logits.device)
            loss_fct = CrossEntropyLoss()
            loss = loss_fct(reshaped_logits, labels)

        if not return_dict:
            return tuple(
                v
                for v in [
                    loss,
                    reshaped_logits,
                    outputs.hidden_states,
                    outputs.entity_hidden_states,
                    outputs.attentions,
                ]
                if v is not None
            )

        return LukeMultipleChoiceModelOutput(
            loss=loss,
            logits=reshaped_logits,
            hidden_states=outputs.hidden_states,
            entity_hidden_states=outputs.entity_hidden_states,
            attentions=outputs.attentions,
        )

__all__ = [
    "LukeForEntityClassification",
    "LukeForEntityPairClassification",
    "LukeForEntitySpanClassification",
    "LukeForMultipleChoice",
    "LukeForQuestionAnswering",
    "LukeForSequenceClassification",
    "LukeForTokenClassification",
    "LukeForMaskedLM",
    "LukeModel",
    "LukePreTrainedModel",
]